Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_arg_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P E Q P S R N V Y E S A P Q R V L S R V V A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V L E Q Q G V E L G P R E R Q E I E Y I V A E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P R P E L G D Y G I P A A R Y A K R Y G I D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I F F K K A T A L L Q Q E P V V A E A K R V G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y L N I T I D V G Y A A K L V F E A V R A E G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E Y G R V K T E K P E R I V V E H T S A N P V H
- - - - - - - - - - - - - V V E H . S A N P V H
---------------------------------------GTAGTTGAGCAT---AGTGCTAACCCTGTACAT
145146147148149150151152153154155156157158159160161162163164165166167168
P L H I G H A R N A S L G D S L A R L L R A R G
P L H I G H A R N A S L G D S L A R L - - - - -
CCCCTCCATATAGGCCATGCGAGAAACGCGAGCTTGGGTGATTCCCTGGCTAGACTG---------------
169170171172173174175176177178179180181182183184185186187188189190191192
H V V Q T R F Y I N D M G R Q V A V L A Y G Y I
- - - Q T R F Y I N D M G - - - - - - - - - - -
---------CAGACACGGTTCTACATAAACGACATGGGA---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A A G L D K P P K D V K P D H W I G L V Y A I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H T L S D I E E L K K R L E Q L K Q E E K Y E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y R Q L L R E L D E L V A T A S R L R E R D P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L F E R I A E A L K G K D P S Q E I S K L M Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y E Y R Q D P E K V E L V R K V V Q L C L Q G F
- - - - - - - - - - - - - - - - - Q L C L Q G F
---------------------------------------------------CAACTATGCCTCCAGGGCTTC
313314315316317318319320321322323324325326327328329330331332333334335336
R E T L S R L G I E I E K W D W E S E L A W T S
R E T L S R L . . E - - K W D W E S E - - - - -
CGTGAAACGCTCTCAAGGCTC------GAG------AAATGGGACTGGGAAAGCGAG---------------
337338339340341342343344345346347348349350351352353354355356357358359360
M V S K I L E Q A R S S P Y A T V H K G A L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N L Q P L L R D P V V R E R L G L P E D Y E I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P L I L Q R S D G T T L Y T T R D I A Y S I K K
- - - - - - - - - - - L Y T T R D I A Y S I - -
---------------------------------CTATACACCACCAGAGACATAGCATACAGTATC------
409410411412413414415416417418419420421422423424425426427428429430431432
F R E F N A D R V F N V I A A E Q R L E Q L Q V
- - - - - - - - - F N V I A A E Q R L E Q L Q V
---------------------------TTCAATGTAATAGCCGCAGAGCAGAGACTAGAACAGCTACAAGTA
433434435436437438439440441442443444445446447448449450451452453454455456
R L A L I A L G Y R R E G L N M I H Y A Y E M V
R L A L I A L - - - - - - - - M I H Y A Y - - -
AGGCTAGCACTCATAGCGCTC------------------------ATGATACACTATGCCTAC---------
457458459460461462463464465466467468469470471472473474475476477478479480
N L P G Q K M S G R R G R Y I T L D E L I D Q A
- - - - - K M S G R - - - - - - - - - - - - - -
---------------AAGATGAGCGGCCGG------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V A I A R Q E V E K R S P G L P E E E K Q K I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E A V G T A A V R Y T L V S V S A P K P M T F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I N E A L N F E R N S A P Y I L Y T H A R A A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I L A K A R E R G I Q L D W D R I D Y S A A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N M L R R S L V I Q A L V Y P Y V F A K A A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q R P E L I V A Y L N R L A D I F N R W Y T S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D S V V N E Q D Q G K Q M F K L A L V Y A V K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665
I L A N A L D L L G I K A I D R M
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_arg_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N P I R S V K E E F C E I V A N G L G I S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I F K T I E Y P P R E E L G D I S L P L P S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K L N V R T E V T F S R G K L I K E V R K T G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y V N A F I D E K E L F K L L F T E M Q D N Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E K T E N P K R I V V E H T S A N P I H P L H
- - - - - - - - - - V V E H . S A N P I H P L H
------------------------------TAATATATTGTA---TCTAGCATAGGTATATTGGAGATATGG
121122123124125126127128129130131132133134135136137138139140141142143144
I G H L R N S I L G D T I S R M L K I R G H D V
I G H L R N S I L G D T I S R M - - - - - - - -
GCCGCTGTTCTGTTCAAAATCTACTATGTTATTAATATTAAATGTTAC------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N R R F Y V N D A G R Q V A I L T L G Y I L L G
N R R F Y V N D A G - - - - - - - - - - - - - -
TATTGCGTATCTTATCGCTGAATTAACTAT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E P E P S P K V D H W F G L I Y S I T N V I I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I R E L K E E L K K D L D P D T Y K D K I N R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D E L V A T A Q S L R E R N P E F F D K L A D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I N S I P D V E S E I Q K I I K S Y E K G D D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K I K Q I V R K I V N L N L D G F R E S L D K L
- - - - - - - - - - N L N L D G F R E S L D K L
------------------------------ACCTTTCGGTATGTTAAGAATTTCCTTTATTTTCTCGTTAAT
289290291292293294295296297298299300301302303304305306307308309310311312
E I S F D V Y D Y E S E L L W S G M V D E V L S
. . . . D V Y D Y E S E - - - - - - - - - - - -
------------GAGAGCCTTAGTTCCCTTATAGTC------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K A F Q I A K D Y K G T K A L E L E D I N E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K E I L N I P K G L K L P P L V L T R S D G T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L Y T T R D I A Y T V K K F S D F K A D T V I N
L Y T T R D I A Y T V - - - - - - - - - - - I N
CTCATAACTCTTTATAATTTTTTGGATTTCACT---------------------------------TAATTT
385386387388389390391392393394395396397398399400401402403404405406407408
V I A E Q Q S I P Q M Q L R A S L Y L L G Y E R
V I A E Q Q S I P Q M Q L R A S L Y L L - - - -
ATCAAAGAATTCAGGGTTTCTTTCTCTTAATGATTGAGCAGTAGCTACAAGTTCATCAAG------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A Q N L V H Y S Y G M V N L Q G M R M S G R L
- - - - L V H Y S Y - - - - - - - - R M S G R -
------------ATCAGGATCTAAATCTTT------------------------TATTTCTATTATAAC---
433434435436437438439440441442443444445446447448449450451452453454455456
G R F I S L D D V I E K V S E V A K K K I E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S G D I S N L R D I V N S A I R Y A I L S V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N K P V T F N I N N I V D F E Q N S G P Y L Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T Y A R A Y N I L A K N Q D E I K L N D A D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D L I G D K R R L L L L I A R F P E T F N K A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D E L R P E D L I D F L R R T A D V F N R W Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F E R V L Q E P D Y R K R I T R L F I V K G I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618
R V L Y N G L N P L G I K P L S R M
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_arg_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y R T T C D A I A A I L R Q H T G K E D V M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T D G G D H A D V A S T I A F S L A K E L R K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P A I I A Q E I A G A I S D Q V M A E T G A E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R A V G P Y V N F I F G A E Y C M N V L E Q A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E G Y G K G Q E K S E R V V L E H T S A N P N
- - - - - - - - - - - - - - V L E H . S A N P N
------------------------------------------GTTCTGGAGCAC---TCTGCAAACCCGAAC
121122123124125126127128129130131132133134135136137138139140141142143144
G P L H V G H I R N T I I G D T L A R C F R K A
G P L H V G H I R N T I I G D T L A R C - - - -
GGCCCCCTTCATGTCGGGCATATCAGAAACACTATAATCGGCGATACGCTGGCCAGATGC------------
145146147148149150151152153154155156157158159160161162163164165166167168
G Y P L E V Q Y Y V N D M G R Q I A I V A W G I
- - - - E V Q Y Y V N D M G - - - - - - - - - -
------------GAAGTCCAATACTATGTCAATGACATGGGC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A T Q G A D I H A E G K G D H L I A D V Y I E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N R H L E K E P A L N A E I D R L M Q L V E S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D P D T I S Q F K I P V K R C L D G F K D T L A
- - - - - - - - - I P V . . . L D G F K D T L A
---------------------------ATCCCGGTG---------CTGGACGGATTTAAAGATACCCTTGCC
241242243244245246247248249250251252253254255256257258259260261262263264
A M H V K H D R F I Y E S D F I R N G D T A K V
A M . . . . D R F I Y E S D - - - - - - - - - -
GCCATG------------GACCGGTTTATCTATGAGAGTGAC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S R I S H L P E A R I E E T L S L D L S A F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F E K N Y I L R R S D G T S V Y A A R D I A F H
- - - - - - - - - - - - - - V Y A A R D I A F H
------------------------------------------GTATATGCCGCGCGTGACATTGCCTTCCAC
313314315316317318319320321322323324325326327328329330331332333334335336
I W K G H N F D R V I D V L G A D H K L I G T Q
I - - - - - - - - - I D V L G A D H K L I G T Q
ATC---------------------------ATCGATGTCCTGGGTGCTGATCACAAACTTATCGGGACTCAG
337338339340341342343344345346347348349350351352353354355356357358359360
L Q A T L E I L G E R V P E I V F F E F V S L P
L Q A T L E I L - - - - - - I V F F E F - - - -
CTGCAGGCAACCCTTGAGATTCTG------------------ATAGTCTTCTTCGAGTTT------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G S M S T R K G K F I S A D E L I A E T E R R
- - S M S T R - - - - - - - - - - - - - - - - -
------TCGATGAGTACCCGG---------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A M E E V T A R R S E L S E E E R K K I A H S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A I S A I R Y D I I R T I P E K S T V F D W K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A L D F E K Q S G P Y I Q Y A H A R A C S I L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K A E S Y T P C F E A E G E G E I A L T K Q I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L F P K V I T E V V T E L K P H L L A I Y A R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L A D I F N S F Y H A E P V L R A E G K I R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R L T L V D A T R N T L K E A L E T L G I D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555
R A M
- - -
---------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/arg_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F L R F I E E V I K A L G E Y G D K K F L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S E H A D L A S T I A F K L A K E R K K S P K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I A D E I V E N L E V E S E Y I G S V E S V N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y I N F F A S Y E F L E D T V N V I L D E D E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y G H L N L K G E I L I E H T S A N P D G P L H
- - - - - - - - - - L I E H . S A N P D G P L H
------------------------------CTGATTGAACAC---TCAGCCAACCCCGACGGGCCCCTGCAC
121122123124125126127128129130131132133134135136137138139140141142143144
I G H I R N S I I G D T I A R I F A K A G F D V
I G H I R N S I I G D T I A R I - - - - - - - -
ATAGGTCACATAAGAAACTCCATAATAGGGGACACCATAGCGAGAATT------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K T H Y Y V N D M G R Q T A I T V L G I E K F G
K T H Y Y V N D M G - - - - - - - - - - - - - -
AAAACGCACTACTACGTAAACGACATGGGA------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L K D K K P D H A V A E A Y I E A N K L L E S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P E L E E Q V E K L M L A Y E E G D E K T V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F R R A V E T A L E G I K Q T L K T I N V E H D
- - - - - E T A L E G I K Q T L K T I . . . . D
---------------GAGACGGCTTTAGAGGGTATAAAGCAAACTCTGAAGACGATT------------GAC
241242243244245246247248249250251252253254255256257258259260261262263264
E F V W E S E F V R N G Y V G K V L G I L E E R
E F V W E S E - - - - - - - - - - - - - - - - -
GAGTTTGTTTGGGAGAGTGAG---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G L V K K N G A W S I E L E G F D K E V V L R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E N G T T L Y I T R D L A Y H M W K N E N Y E R
- - - - - L Y I T R D L A Y H M - - - - - - - -
---------------CTCTACATCACCAGAGACCTCGCTTATCACATG------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F I N V L G A D H K L Y G A Q L S K I L E L L G
- I N V L G A D H K L Y G A Q L S K I L E L L -
---ATAAACGTTCTTGGGGCAGACCACAAGCTTTACGGCGCTCAGCTGTCGAAAATTCTTGAGCTTCTC---
337338339340341342343344345346347348349350351352353354355356357358359360
L K P P E I I F F E F V S L P E G S M S T R R G
- - - - - I I F F E F - - - - - - S M S T R - -
---------------ATAATCTTTTTCGAGTTC------------------AGCATGAGCACGAGG------
361362363364365366367368369370371372373374375376377378379380381382383384
K F I S A D E L I S K V R D E A W K I L S E R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M E E D E K R K I A D A V A V G A I R F D F I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I A P E K H M T F D W S K A L D F E R Q T A S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I Q Y S H A R A C S I L R K A V E D G M P E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F K G E L C T A G E R K L V M L L S K M P Y V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K R I V S E L R P N V F A E Y L L S V A G T F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D F Y R D H P V L K A E S E V R M H R L A I V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549
A T R V V L R N G L E L L G I E P L E R M
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_arg_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F R Y I E K E A R D S I T A A L E K L G I K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P P E I K L E E P P N P Q L G D L A S T V S F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L A G K L R R A P I E I T A D I M S V I E T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I F E T I E S K G P Y I N F F V D Y G R F S S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L L E S I Q D D Y G S H P P R D E R V I L E H T
- - - - - - - - - - - - - - - - - - - I L E H .
---------------------------------------------------------GGATGCACAGCC---
121122123124125126127128129130131132133134135136137138139140141142143144
S A N P N G P L H I G H I R N A I I G D S L A R
S A N P N G P L H I G H I R N A I I G D S L A R
CTCAAAGCTGAGGGCATCATCCCACCGGAATACGATGTGCTTCTCGGGTGAGAGCCTTGCTATGTAGTACCT
145146147148149150151152153154155156157158159160161162163164165166167168
I L R M A G Y D V E T Q Y Y V N D M G R Q I A M
I - - - - - - - - E T Q Y Y V N D M G - - - - -
TAT------------------------AATATCATCTGCAACATCATCGGGAAGATC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
I V W G L L N L D G D L E D Y P G D K M D H R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G K L Y F E V N Q R L K E N P G I R D E V D E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I R K Y E A G E N E E L F R K V V E Y C L S G M
- - - - - - - - - - - - - - - - - E Y C L S G M
---------------------------------------------------GATGATAACATCCCCCTCCTC
241242243244245246247248249250251252253254255256257258259260261262263264
E E T M K R L H V H H D R F V W E G Q F V R D G
E E T M K R L . . . . D R F V W E G Q - - - - -
TGACTTCTGGAGGTGGTAGGC------------TGAGTAGAGGGAGGTTCCATCTGA---------------
265266267268269270271272273274275276277278279280281282283284285286287288
T V D R V I E S L R K T G Y T G E N D V L Y L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E E F G L E K E L V L T R S D G T S L Y S T R
- - - - - - - - - - - - - - - - - - - L Y S T R
---------------------------------------------------------GAAGCGGTCGTGGTG
313314315316317318319320321322323324325326327328329330331332333334335336
D I A Y H L Q K S E E G D V I I D V L G S D H K
D I A Y H L - - - - - - - - - I D V L G S D H K
AACGTGGAGCCTTTTCAT---------------------------CTCAACAACCTTCCTGAATAGCTCCTC
337338339340341342343344345346347348349350351352353354355356357358359360
L A A E Q V G I A V E L L G G K R P E V I F Y E
L A A E Q V G I A V E L L - - - - - - V I F Y E
GTTCTCCCCTGCCTCATACTTCCTTATTAGTTCATCCAC------------------ATTTTCCTTTAGCCT
361362363364365366367368369370371372373374375376377378379380381382383384
F I T L P E G S M S T R R G V F I S V D E L M D
F - - - - - - S M S T R - - - - - - - - - - - -
CTG------------------TTTACCTACCCTGTG------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E A H S R A L H E V K K R R D L P D D V A D D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A E S I G N G A I R Y Y I A R L S P E K H I V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R W D D A L S F E R G C A S I Q Y A H A R A C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L L E K A S F T G E E D I E D G W K P E G D E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L V R L L A R F P V V V E E S A L A R R V H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V A Q Y A Q D L A N T F N S F Y R S T P V I G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D F E G A R L R L V D S V R K T L R N A L N L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560
G I H A P E T M
- - - - - - - -
------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_arg_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D P L R Q P R E E F V K V L G E V S R E L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P E V P E V E R T R R Y G F F S A R F H K Y K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D H S R L A E V V N L I K N K R F E F L S S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V D G L Y L N A D L N V S K V A E L V F E A V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K M G R K Y G F T E E C V T G S Y L V E H T S A
- - - - - - - - - - - - - - - - - L V E H . S A
---------------------------------------------------TTGGAGAAATGT---TGAATT
121122123124125126127128129130131132133134135136137138139140141142143144
N P V H P L H I G H G R N A I L G D S L A R L L
N P V H P L H I G H G R N A I L G D S L A R L -
CTGTCTTAGGTTTAGCACGACGTCCCATTTGAATTCAATTGGCTTGCGCGGGCTTGTGGTAAGAAAGGC---
145146147148149150151152153154155156157158159160161162163164165166167168
K F C G N K V E T H F Y V D D C G V Q V M Y A A
- - - - - - - E T H F Y V D D C G - - - - - - -
---------------------TCTTTCCGCAATTACTCCGCTCACCTCTGG---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
M G Y N A V K D E V K K R I E K S K P D V V I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H V Y S A T N A V A E I G R L K K E L E K A Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D E R K R E I L R E I D E W V A V L K R L M D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E G D I I S K I A E E L G R R D L L N E A V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N R R Y E S G D P E A K G V V R E V V D L V L K
- - - - - - - - - - - - - - - - - - - D L V L K
---------------------------------------------------------TTGGACAAATTTATC
289290291292293294295296297298299300301302303304305306307308309310311312
G Q R E T L A R L G V E I D K W D Y E S E L T V
G Q R E T L A R L . . . . D K W D Y E S E - - -
AGCGCGAAAAACAACTGCGCCGCCCTT------------CTGAGGCCACCTCTTCTGGAGCTC---------
313314315316317318319320321322323324325326327328329330331332333334335336
W S S E A M R I V S E L Q K R W P Q Y I E I K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G A V V F R A D K F V Q D Y N L W D V L D L P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I P P V T L T R S D G T T L Y V T R D V A Y A
- - - - - - - - - - - - - - L Y V T R D V A Y A
------------------------------------------GAGATCCCTCCGTCCCAGCTCCTCTGCGAT
385386387388389390391392393394395396397398399400401402403404405406407408
L W Q A R Q G F D K V I R V I S T E Q T H E Q A
L - - - - - - - - - - I R V I S T E Q T H E Q A
CTT------------------------------CCTTTTTAAAACGGCGACCCACTCATCAATCTCTCTCAA
409410411412413414415416417418419420421422423424425426427428429430431432
H V R I I L Y A L G Y V D E A K K I V H Y A Y E
H V R I I L Y A L - - - - - - - - I V H Y A Y -
AATCTCTCTTTTCCTCTCATCGTCTTG------------------------TCTGCCTATCTCAGCCAC---
433434435436437438439440441442443444445446447448449450451452453454455456
M V N L P G M K M S A R R G Q Y I S L D E I L D
- - - - - - - K M S A R - - - - - - - - - - - -
---------------------GCCGATGACAACATC------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E A A E R S A S L V K E K N P E V S G V I A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V G V G S V R Y A F L T T S P R K P I E F K W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V V L N L R Q N S G T F L Q Y T Y V R A Y S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E K A G E I G N V P V P E N M L A E E R E L V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K I A E W P S V V K E A A K S L R P D Y V A E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L D G L A L V F N S Y Y E K A P V L K A E E S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R G F R I A I V N A V K T V L E A G F Y I L G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630
P T L T K M
- - - - - -
------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_arg_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L L F Q D L R K D I Y E I V S K R F R I S E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D V Y L D D T G H S D I T I R V F R I L K S P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G G E N A V M E I V R S I S E K D Y V E K A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E G G Y I N V W I K R T Y M L R E V L E S I E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S G T Y P D V F Q E A E R V S V E H T S A N P T
- - - - - - - - - - - - - - S V E H . S A N P T
------------------------------------------CGAATACATTAT---AGGCGCAGAATTGGA
121122123124125126127128129130131132133134135136137138139140141142143144
G P L H I G R A R N S I I G D S I Y R I L S R Y
G P L H I G R A R N S I I G D S I Y R I - - - -
TTCAAAGTTGAGCGCCTCCTCCCACCTGAACGTTATGGGCTTTGGTGCGCTCACCCTGAT------------
145146147148149150151152153154155156157158159160161162163164165166167168
G Y R T V R Q Y F V N D S G K Q M I S L Y T A Y
- - - - V R Q Y F V N D S G - - - - - - - - - -
------------GGCGATCACCTCAGCTATTTTTTTGCGTTC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I K Y G G P I T I E N L L E N Y Q K I Y R E M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K D Q S I E K E I E K N I E R Y E N A D P E V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G T L R K I A G V M L D G I A S T L K R I G I E
- - - - K I A G . . . D G I A S T L K R I . . .
------------GTGGTTCAGCGA---------ATCCTTATGATCTTCACCGAGAACGTCTAT---------
241242243244245246247248249250251252253254255256257258259260261262263264
F D E F D W E S D L L L N G S V R K A I D M L E
. D E F D W E S D - - - - - - - - - - - - - - -
---GTTTTCTGCCTTGAAGAGGTGGTA---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T K E E D S A R Y I E I S G K K V F L T R K D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T T L Y F A R D I A Y H L F K A E N S E W I I D
- - L Y F A R D I A Y H L - - - - - - - - - I D
------CCTCACGCTGCCGTTGAGAAGAAGATCAGATTC---------------------------GATCCT
313314315316317318319320321322323324325326327328329330331332333334335336
V L G E D H K D H A K S L N H V L K E M L K L E
V L G E D H K D H A K S L N H V L K E M - - - -
CTTGAGCGTTGAGGCGATGCCGTCAAGCATGACGCCCGCAATTTTCCTCAGTGTTCCGAA------------
337338339340341342343344345346347348349350351352353354355356357358359360
N R V S F M Y Y S F I T L E T G K M S T R R G N
- - V S . . . . . . . . . E . . . . . . . . . .
------CTCGTA---------------------------CTC------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I V T L Q D L V D R T Y D E A L K I V N E K R P
. . . L Q . . . . . . Y - - - - - - - - - - - -
---------GTAATT------------------TGT------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L S E E E R K K I A E V I A S S A V R Y S I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R V S A P K P I T F R W E E A L N F E S N S A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F I M Y S H A R A A S I L D K A P E P E Q S Y G
- - - - - - - - - - - - - - - - - - - - - S . .
---------------------------------------------------------------AAT------
457458459460461462463464465466467468469470471472473474475476477478479480
M D M P K E E A D L V K A M Y V Y P Y Y L K D A
. . . . . . . . . . . . . M . . . . . . . . . .
---------------------------------------ATT------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A Q D L K P D L I A A Y L I S L V Q K F N D F Y
. . . . . . . . . . . . . . S . . . . . . . . .
------------------------------------------GGC---------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G A C R V I G T D P L T Y A R R I R I V K A Y K
. . . . . . . . . . . T . . R - - - - - - - - -
---------------------------------ACC------ATC---------------------------
529530531532533534535536537538539540541542543544545546
Q I L S D A G D L I G I K M L D Q M
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_arg_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K A Y I E E A L R Q V L R T I D G V P E D F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P E L E K P N N P E H G D L A T N A A M Q L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y L K R P P R Q I A E E I A E R L R A L P L D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R R V A S V E V A G P G F L N F R F A P D Y L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q V L A D I L A A G E R Y G R S D L G Q G R P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I V E Y V S A N P T G P L T V G H G R N A V L G
I V E Y . S A N P T G P L T V G H G R N A V L G
GTAAAAGACCGG---CTTCTCGCTGGCCTCACGGGCCAGATCCAGATCGAACTCCAGGTGCGTGTTGGGCGA
145146147148149150151152153154155156157158159160161162163164165166167168
D T I A N L L D W I G Y R V T R E Y Y Y N D A G
D T I A N L - - - - - - - - T R E Y Y Y N D A G
GCGCATCAGGAAGAAAAA------------------------GTCGATCAGTTCGTCGAGCGTCACGTAGGT
169170171172173174175176177178179180181182183184185186187188189190191192
R Q M R V L G E S V R A R Y L A L V D P N L P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K K I Q A A E G E W V E V P E P F P E D G Y L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D Y I I D I A R M L Y E Q H G E A L R D V E D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T P F K E A A E K V I F E D I R R T L A R L G I
- - - - - - - - K V I F E D I R R T L A R L . .
------------------------GACCAGCACCGTATCCTGATCTTTGCCCAGCGCACTCGTGCG------
265266267268269270271272273274275276277278279280281282283284285286287288
H M D S Y F N E H T L Y E N G K I W E V V E A L
. . D S Y F N E H T - - - - - - - - - - - - - -
------GCCGTCTTTTTCGTAGATGTAGCC------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R A K G Y I Y E K D G A V W F R T S A L G K D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D T V L V K R T G E P T Y R L P D I A Y H I T K
- - - - - - - - - - - T Y R L P D I A Y H I - -
---------------------------------CGGCGTGATGTCTTCCACGTCGCGGAGCGCCTC------
337338339340341342343344345346347348349350351352353354355356357358359360
F E R G F E R I V D V F G A D H I A T Y P D V L
- - - - - - - - V D V F G A D H I A T Y P D V L
------------------------GTCGATGATGTAGTCGCCCAGGTAGCCGTCCTCGGGGAAGGGCTCGGG
361362363364365366367368369370371372373374375376377378379380381382383384
R A L E V L G Y D V S K V D V V I Y Q F V T L V
R A L E V L - - - - - - V D V V I Y - - - - - -
CACCTCCACCCATTCGCC------------------TTTGGTGGGCAGGTTTGG------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R G G E P V K M S T R K A T Y V T L D E L I D E
- - - - - - K M S T R - - - - - - - - - - - - -
------------------GCCCAGCACGCGCAT---------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V G E D V T R F F F L M R S P N T H L E F D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L A R E A S E K N P V F Y L Q Y A H A R I C S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M R K A D E V G L K E S P N P D L T L L Q H E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E Q A L I K E L M R F P E V I Q E A A Q T Y E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H R V A N Y L R E V A V A F T K F Y D H C R I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G E P E P L A Q A R L A L A R A A R L V L A N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564
L R V L G I S A P E R M
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_arg_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R E L L D N R L Q F N G E A Y I I K D S P L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S Y V K E L E K V G H K Y R V I F D I E K V I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y L E N P P T Y K K N Q T Y V L D Y F S P N I G
- - - - - - - - - - - - - - V L D Y . S P N I G
------------------------------------------GTTTTAGATTAC---TCTCCAAACATCGGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K P P H V G N L R S A I I G N P L K N I L R K V
K P P H V G N L R S A I I G N P L K N I - - - -
AAACCCCCACATGTTGGTAACCTAAGAAGTGCCATTATTGGGAACCCATTAAAAAATATA------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G Y N V I S I N W W G D F G T Q F G E L I Y A F
- - - - I S I N W W G D F G - - - - - - - - - -
------------ATATCTATTAATTGGTGGGGGGATTTTGGC------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K T K G D E K E L R K N P I K H L F E L Y T W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N R E L E K N P E I K N Y A R E E F K Y L E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
M Y K G I Q I D V S P F F E G K P L S E L L K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K T R E E Q N Y I L W K I F R E I T I K Y M R E
- - - - - - - - - - - - - - - E I T I K Y M R .
---------------------------------------------GAAATAACTATAAAATATATGCGA---
217218219220221222223224225226227228229230231232233234235236237238239240
Q F Y P K L K L E F D E E S G E S F F L K K A K
Q F Y P K L . . . . D E E S G E S F - - - - - -
CAATTTTATCCAAAACTA------------GATGAAGAGAGCGGGGAATCCTTC------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E V A K E L L E K G V A E E D K N S I I V R T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y G V A L L L K S D G T T L Y L T R D L A A A I
- - - - - - - - - - - - - L Y L T R D L A A A I
---------------------------------------TTGTATTTAACTAGGGATTTAGCTGCGGCTATA
289290291292293294295296297298299300301302303304305306307308309310311312
E H Y E K Y K F D K K I Y V V A N E Q S Q H F N
- - - - - - - - - - - I Y V V A N E Q S Q H F N
---------------------------------ATCTATGTAGTAGCGAATGAGCAATCGCAACATTTTAAT
313314315316317318319320321322323324325326327328329330331332333334335336
Q L I Y I A K K A N Y P F A D K L Y H L K F G L
Q L I Y I A K K A N Y . . . . . . . . . . . . .
CAATTAATTTATATAGCTAAGAAAGCCAATTAT---------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L L L K T E E G V K K F S T R K G R A V F A E D
. . . . . . . . V K K F - - - - - - - - - - - -
------------------------GTAAAAAAGTTC------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I L E K A Y E L A K E E I L K R N K D K P L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I E K N A K I I G Y G A V I Y A I V R Y D P K K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAA
409410411412413414415416417418419420421422423424425426427428429430431432
D I I F D W D K I L S L N G K T S V F I Q Y S A
. . . F . . . . . . S . . . . T . . . . . . . .
---------TTT------------------TCT------------ACA------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V R A K H I L D K Y N K P I E R P N N L E K D E
. R - - - - - - - - - - - - - - - - - - - - - -
---AGG------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E R L L L W L F Y Y Y A V L E E S A R K L K P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I L A E Y L Y N L A E E F N R F Y E K N R V I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S N R E K E R V W L V N K T Y Q I L K E G L N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537
L G I D V P T F M
- - - - - - - - -
---------------------------
Class I
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_arg_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E Q N I T N I L I K K I E E L T E T I Y D E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R L E E P P S I S L G D Y S T N I S F K L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L K K S P M V I A E E L T N L L I S E N I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I K E I K A V N G Y I N F F I D Y N L Y S K S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I A K I S S E K D K F G Q G A P K N K K V I I E
- - - - - - - - - - - - - - - - - - - - - I I E
---------------------------------------------------------------ATAATTGAA
121122123124125126127128129130131132133134135136137138139140141142143144
H T S A N P N G P L H I G H S R N A I V G D S L
H . S A N P N G P L H I G H S R N A I V G D S L
CAT---TCGGCTAACCCAAACGGACCACTCCATATAGGACACAGCAGAAATGCCATTGTTGGAGACAGCTTA
145146147148149150151152153154155156157158159160161162163164165166167168
K R I V E F A G Y V V E A Q Y Y V N D M G R Q E
K R I - - - - - - - - E A Q Y Y V N D M G - - -
AAAAGAATT------------------------GAGGCCCAATATTATGTAAATGATATGGGA---------
169170171172173174175176177178179180181182183184185186187188189190191192
A I V V Y G L D K F E L N E Q Q K P D H A I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V Y F K A N Q L L N E N P E Q E E E I L K L M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K Y E E A S E K G E E N E L T N K F N Y A V N Y
- - - - - - - - - - - - - - - - - - - - - - N Y
------------------------------------------------------------------AATTAT
241242243244245246247248249250251252253254255256257258259260261262263264
A L S G F K E T L N N L N I H H D K F V W E S S
A L S G F K E T L N N L . . . . D K F V W E S S
GCCCTAAGTGGATTTAAAGAAACCCTTAATAACTTA------------GATAAATTTGTATGGGAGAGCTCC
265266267268269270271272273274275276277278279280281282283284285286287288
Y V K N G M V Q K V I Q T L K D T G K V E K D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V Y R L D L S E F G I D K K L V L A R L N G T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L Y S T R D I A Y H I D K M K N C D I G I N I L
L Y S T R D I A Y H I - - - - - - - - - I N I L
CTATACTCCACAAGAGATATTGCATATCATATT---------------------------ATTAATATTCTT
337338339340341342343344345346347348349350351352353354355356357358359360
G A D H K L T A E M V N A S L K L L G Y N T P E
G A D H K L T A E M V N A S L K L L - - - - - -
GGAGCTGACCACAAATTAACAGCAGAAATGGTAAATGCCAGTTTAAAATTGTTG------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V F Y E F I S L P E G S M S T R R G T F I S I
V V F Y E . . . . . . . . . . . . . . . . . . .
GTAGTATTTTATGAA---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D E L Y E E A K N R A V K E I K K R N E T T E E
. . . Y - - - - - - - - - - - - - - - - - - - -
---------TAT------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E I N N I A H K I A V G A V R Y N I V R I S P
- - - - - - - - - - - - - - - - - - - - - - S .
------------------------------------------------------------------TCG---
433434435436437438439440441442443444445446447448449450451452453454455456
D K A M V F R W D D A L D F E K V G A P V I Q Y
. . . M . . . . . . . . . . . . . . . . . . . .
---------ATG------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A H A R C C R I L E K E N T N E N K P I D A T E
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L F E Y D L N E H E K L L I K I L L K F P K I V
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E K S A D A K K P Q I M A T Y A L D V A Q T F N
. . S . . . . . . . . . . . . . . . . . . T . .
------TCA------------------------------------------------------ACA------
529530531532533534535536537538539540541542543544545546547548549550551552
R Y Y A N C P I F K E E N K N I V Y S R L E L V
R - - - - - - - - - - - - - - - - - - - - - - -
AGA---------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574
K C T K T I I E N A L N L L G I E C P G K M
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_arg_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F L E L K A Q A T S I L K E A I L K V G F E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E D S E L Q F E T S S H A D L A S R V A F R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S I H K Q N P K E L A S R I V S A I E I P E G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y I G E V S A A G P Y I N F L A G R H Y M D E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V T A V R E E K E K F G C G A P K D R I L L E H
- - - - - - - - - - - - - - - - - - - - L L E H
------------------------------------------------------------CTCCTTGAGCAC
121122123124125126127128129130131132133134135136137138139140141142143144
T S A N P N G P L H V G H I R N S I I G D T L A
. S A N P N G P L H V G H I R N S I I G D T L A
---TCGGCAAACCCTAACGGCCCCCTGCACGTAGGGCATATCCGCAATTCGATTATAGGAGACACTCTTGCC
145146147148149150151152153154155156157158159160161162163164165166167168
R I L R R A G Y D V E V Q Y Y V N D M G R Q I A
R I - - - - - - - - E V Q Y Y V N D M G - - - -
CGCATC------------------------GAGGTCCAGTACTATGTTAACGACATGGGA------------
169170171172173174175176177178179180181182183184185186187188189190191192
V V S W A C E R F E L D L S R K S D A A I A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y I K A N V E L D K N P D Y V K K I D A L M E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V E V G D L Q T I E R F D K A V S L A I A G I K
- - - - - - - - - - - - - - - - S L A I A G I K
------------------------------------------------TCCTTGGCTATTGCCGGGATCAAA
241242243244245246247248249250251252253254255256257258259260261262263264
E T L L R L N V V H D K F V N E S R F L K S G E
E T L L R L . . . . D K F V N E S R - - - - - -
GAAACCCTCCTCCGCTTA------------GATAAATTCGTGAATGAGTCTCGC------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V H D I V E R I K A T G R T E T D K G A L V V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L S D Y G F E K T L V I Q R S N G T S L Y T T R
- - - - - - - - - - - - - - - - - - - L Y T T R
---------------------------------------------------------CTCTACACGACCCGC
313314315316317318319320321322323324325326327328329330331332333334335336
D L A Y H E W K A G Q A D R I I D V F G A D H K
D L A Y H E - - - - - - - - - I D V F G A D H K
GACCTTGCCTACCATGAA---------------------------ATCGATGTTTTCGGAGCCGACCACAAG
337338339340341342343344345346347348349350351352353354355356357358359360
L I S G Q L R A T L N A I G I K E P E V V I F E
L I S G Q L R A T L N A I - - - - - - V V I F E
CTTATTTCCGGCCAGCTCAGGGCTACATTGAATGCAATA------------------GTCGTAATTTTTGAG
361362363364365366367368369370371372373374375376377378379380381382383384
F V S L P E G S M S T R R G Q F I S A D D L F D
F - - - - - - S M S T R - - - - - - - - - - - -
TTT------------------TCAATGAGCACTCGC------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R V T E A A F E Q V E S R R P E T S T E F K K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V A E M V G I G A V R Y D I V R V S P E K S T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F N W K E A L D F E K Q G A P Y I Q Y S H A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
C S I L E K A K D E A A W D P A E E I T P S L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V E D S E I D L I K K M A M F D S I I D L G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L K P H V L A I Y A R E L A D S F N Q F Y R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V P V I A A E D E K V R A S R L A L V D C A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569
V L A N S L D T L G I G A P E S M
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_arg_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I K S N I I N A L K E V I S K E I C K E I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I K L D K T P N L E L G D Y S V N I C F R L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L K K N P K I I A E E L V D K L K A M N I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V K E I K A V N G Y I N F Y I D Y N K F A K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M E E I D K K G N N Y G R G D K K S I K I I L E
- - - - - - - - - - - - - - - - - - - - - I L E
---------------------------------------------------------------ATCTTAGAA
121122123124125126127128129130131132133134135136137138139140141142143144
H T S A N P N G P L H I G H L R N A I I G D C L
H . S A N P N G P L H I G H L R N A I I G D C L
CAT---TCAGCAAATCCAAATGGGCCTTTACATATTGGACATTTAAGAAATGCCATTATTGGAGATTGTTTA
145146147148149150151152153154155156157158159160161162163164165166167168
K R I L E F Y G Y D V E T H Y Y V N D M G R Q M
K R I - - - - - - - - E T H Y Y V N D M G - - -
AAGAGAATA------------------------GAAACCCACTACTATGTAAATGATATGGGT---------
169170171172173174175176177178179180181182183184185186187188189190191192
A L V V Y G I E L F G L D K E K K K D H A I A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T Y V K I N K Y L E E H P E E E E K I L E L M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K Y E D A L E N N E D N E I T K K F E F A V N Y
- - - - - - - - - - - - - - - - - - - - - - N Y
------------------------------------------------------------------AATTAT
241242243244245246247248249250251252253254255256257258259260261262263264
A L D G I K E T L K N L N I K H D T F V W E S S
A L D G I K E T L K N L . . . . D T F V W E S S
GCATTGGATGGAATAAAAGAGACATTAAAGAATTTA------------GATACCTTTGTTTGGGAAAGCTCT
265266267268269270271272273274275276277278279280281282283284285286287288
Y V R N G M V K K V I E K L M E T G K V I K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T Y M L D L S D F G I E K K M V L A R A N G T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L Y S T R D I A Y H L D K L S K C D I G I D V L
L Y S T R D I A Y H L - - - - - - - - - I D V L
TTGTATTCAACAAGAGATATTGCCTATCACTTA---------------------------ATAGATGTCTTA
337338339340341342343344345346347348349350351352353354355356357358359360
G A D H K L T A E M V K A A L K L L G S K V P E
G A D H K L T A E M V K A A L K L L - - - - - -
GGGGCTGACCACAAATTAACGGCAGAGATGGTTAAAGCAGCTTTAAAACTCCTT------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V I F Y E F I S L P E G S M S T R R G R F I S T
V I F Y E . . . . . . . . . . . . . . . . . . .
GTTATATTCTATGAA---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D E L L E E A I K R A K E E C N K R G V E E N I
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A Y D I G L G A V R Y N I A R I S P E K P M V F
. Y - - - - - - - - - - - - - - - - - - - - - -
---TAT------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R W E E A L D F E K V G C P F I Q Y A H A R C C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S I L K E A E N K G V K D E A V F N Y E L T S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E K E L I K M L D E F K D I I K E S A E S R R V
- - - - - - - - - - - - - - - - - - - - S . . .
------------------------------------------------------------AGT---------
505506507508509510511512513514515516517518519520521522523524525526527528
H I L A N Y L L E L A K A F N R F Y A N C P I L
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
M T K V D D D V K K S R L K L V K S T K T V L E
M . . . . . . . . . . . . . . . . S T . . . . .
ATG------------------------------------------------AGCACT---------------
553554555556557558559560561562563564565566
T G L E L L G I N C P G R M
. . . . . . . . . . . . R -
------------------------------------AGG---
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_arg_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P D Q P S R R V Y E A A P Q R L L A R A V A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L E R Q G A S L S E E E R R Q I E Y T V A E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P N P E L G D Y G I P L A R Y A R R Y R A D I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R L F E D A S S I L A E E P I V S E A K R A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y L N I T L N A V E A A R L V F D A A R R E G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G Y G R V K T D K P M R I V V E H T S A N P V H
- - - - - - - - - - - - - V V E H . S A N P V H
---------------------------------------GAGGGCCTCCTC---GCTGAAGGTCATGGGCTT
145146147148149150151152153154155156157158159160161162163164165166167168
P L H I G H A R N A S L G D T L A R L L R A R G
P L H I G H A R N A S L G D T L A R L - - - - -
AGAGGCTGACACTGAGACGAGGGTGTAGCGCACCGCTGCCGTACCAACCGCCTCTGC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
H V V Q T R F Y I N D M G R Q V A V L A Y G Y I
- - - Q T R F Y I N D M G - - - - - - - - - - -
---------GAGGTCTGGGCTTCTCTTCTCCACCTCTCT---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A A G L G E P P E G V K P D H W I G L V Y A I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H T L A D I E E L K K R L E R L R K E E R Y E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y R Q L L R E L D E L V A D A S R L R E R D P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L F E R I A K A L Q G R N P E E E I S R L M Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y E Y R R G P E K V E K I R R V V N L C L Q G F
- - - - - - - - - - - - - - - - - N L C L Q G F
---------------------------------------------------GTCGAGTGCGAGGGCTCCCTT
313314315316317318319320321322323324325326327328329330331332333334335336
R E T L G R L G I V I D K W D W E S E L A W T S
R E T L G R L . . . . D K W D W E S E - - - - -
GTGCACTGTGGCGTAGGGGCT------------CTCGAGTATCTTGGAGACCATGCT---------------
337338339340341342343344345346347348349350351352353354355356357358359360
M V S K I L E Q A R R S P Y A T V H K G A L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L Q P L L K D P V V R K H L G V P E S Y E V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P L I L Q R S D G T T L Y T T R D I A Y S I K K
- - - - - - - - - - - L Y T T R D I A Y S I - -
---------------------------------CTTGGCTATCCTCTCAAATAGGGCTGGGTCCCG------
409410411412413414415416417418419420421422423424425426427428429430431432
F R E F N A G K V F N V I A A E Q R L E Q L Q V
- - - - - - - - - F N V I A A E Q R L E Q L Q V
---------------------------GTCGAGCTCGCGGAGGAGCTGGCGGTACTCCTCGTACCTCTCCTC
433434435436437438439440441442443444445446447448449450451452453454455456
R L A L I A L G Y R R E G L N M I H Y A Y E M V
R L A L I A L - - - - - - - - M I H Y A Y - - -
CTTTCTGAGCCGCTCTAACCT------------------------GAGCGTATGCGTTATGGC---------
457458459460461462463464465466467468469470471472473474475476477478479480
N L P G Q K M S G R R G R Y I T L D E L L D Q A
- - - - - K M S G R - - - - - - - - - - - - - -
---------------TGGCTTAACCCCCTC------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V E M A R R E V E K R S P D L P E D E K K R I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E A V G T A A V R Y T L V S V S A S K P M T F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I E E A L N F E R N S A P Y V L Y T H A R A S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I L A K A R E R G I S L D W D S I D Y T A A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N Q L R R S L V L Q A L I Y P Y I F A K A A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q R P E L I V A Y L N R L A D T F N K W Y T S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D S A V N E P D P G K R V F K L A L V Y T V K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665
I L A N A L D L L G I K A V E R M
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Escherichia coli/amino acid sequences/Ecoli_arg_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I Q A L L S E K V R Q A M I A A G A P A D C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P Q V R Q S A K V Q F G D Y Q A N G M M A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K L G M A P R Q L A E Q V L T H L D L N G I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S K V E I A G P G F I N I F L D P A F L A E H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q Q A L A S D R L G V A T P E K Q T I V V D Y S
- - - - - - - - - - - - - - - - - - - V V D Y .
---------------------------------------------------------GTGGTTGACTAC---
121122123124125126127128129130131132133134135136137138139140141142143144
A P N V A K E M H V G H L R S T I I G D A A V R
A P N V A K E M H V G H L R S T I I G D A A V R
GCGCCAAACGTGGCGAAAGAGATGCATGTCGGTCACCTGCGCTCTACCATTATTGGTGACGCAGCAGTGCGT
145146147148149150151152153154155156157158159160161162163164165166167168
T L E F L G H K V I R A N H V G D W G T Q F G M
T - - - - - - - - I R A N H V G D W G - - - - -
ACT------------------------ATTCGCGCAAACCACGTCGGCGACTGGGGC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I A W L E K Q Q Q E N A G E M E L A D L E G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y R D A K K H Y D E D E E F A E R A R N Y V V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L Q S G D E Y F R E M W R K L V D I T M T Q N Q
- - - - - - - - - - - - - - - - D I T M T Q N Q
------------------------------------------------GACATCACCATGACGCAGAACCAG
241242243244245246247248249250251252253254255256257258259260261262263264
I T Y D R L N V T L T R D D V M G E S L Y N P M
I T Y D R L N - - - - - - D V M G E S L - - - -
ATCACCTACGATCGTCTGAAC------------------GACGTCATGGGTGAAAGTCTC------------
265266267268269270271272273274275276277278279280281282283284285286287288
L P G I V A D L K A K G L A V E S E G A T V V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L D E F K N K E G E P M G V I I Q K K D G G Y L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CTC
313314315316317318319320321322323324325326327328329330331332333334335336
Y T T T D I A C A K Y R Y E T L H A D R V L Y Y
Y T T T D I A C A K - - - - - - - - - - - L Y Y
TACACCACCACTGATATCGCCTGTGCGAAA---------------------------------CTGTATTAC
337338339340341342343344345346347348349350351352353354355356357358359360
I D S R Q H Q H L M Q A W A I V R K A G Y V P E
I D S R Q H Q H L M Q A W A I V R K A - - - - -
ATCGATTCCCGTCAGCATCAACACCTGATGCAGGCATGGGCGATCGTCCGTAAAGCG---------------
361362363364365366367368369370371372373374375376377378379380381382383384
S V P L E H H M F G M M L G K D G K P F K T R A
- - - L E H H M F - - - - - - - - - P F K T R -
---------CTGGAACACCACATGTTC---------------------------CCGTTCAAAACCCGC---
385386387388389390391392393394395396397398399400401402403404405406407408
G G T V K L A D L L D E A L E R A R R L V A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N P D M P A D E L E K L A N A V G I G A V K Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D L S K N R T T D Y I F D W D N M L A F E G N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A P Y M Q Y A Y T R V L S V F R K A E I N E E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L A A A P V I I R E D R E A Q L A A R L L Q F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E T L T V V A R E G T P H V M C A Y L Y D L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L F S G F Y E H C P I L S A E N E E V R N S R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K L A Q L T A K T L K L G L D T L G I E T V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577
M
-
---
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_arg_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Y A L E R F I T D I K D A I A A T G K V P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L I E I T T P K P N I P A D R T F V T F K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K V L G V D P A K L A A E L A A T I A P P P D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L I G E V T A T G A F L N F S L H P Q R L A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V L N E I E T A G E A Y G T V A D G A G R T V V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTG
121122123124125126127128129130131132133134135136137138139140141142143144
I D Y S S P N I A K R M H V G H I R S T I I G Q
I D Y S . P N I A K R M H V G H I R S T I I G Q
ATCGATTATTCT---CCCAATATCGCCAAGCGCATGCACGTCGGCCATATCCGCTCGACGATTATCGGGCAG
145146147148149150151152153154155156157158159160161162163164165166167168
A L V H I F R A L G Y R V I G D N H L G D W G T
A L V H I - - - - - - - - I G D N H L G D W G -
GCGCTCGTTCATATC------------------------ATCGGCGATAACCATCTCGGCGACTGGGGG---
169170171172173174175176177178179180181182183184185186187188189190191192
Q F G I I L A A M Q R Y G R P Q N E G E A A M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L E A L Y A R Y N A E M K D D P A L E D E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R W S L A L E R G D P E A R S L W Q W C V D L S
- - - - - - - - - - - - - - - - - - - - - D L S
---------------------------------------------------------------GATCTGTCA
241242243244245246247248249250251252253254255256257258259260261262263264
L R A A Q R N Y D R L G I R F D Y A Y G E S F Y
L R A A Q R N Y D R L G - - - - Y A Y G E S F -
TTGCGGGCCGCCCAACGCAACTACGACCGGCTCGGC------------TACGCCTACGGCGAAAGCTTC---
265266267268269270271272273274275276277278279280281282283284285286287288
E A M L P G V I E E A L R S E A A F R D V D G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V V A E L D K L P K F I I Q R S D G G T V Y M T
- - - - - - - - - - - - - - - - - - - - V Y M T
------------------------------------------------------------GTCTATATGACC
313314315316317318319320321322323324325326327328329330331332333334335336
R D I A T I K F R L Q E F S P S H I I Y V V D A
R D I A T I K - - - - - - - - - - - I Y V V D A
CGTGACATCGCGACGATTAAA---------------------------------ATCTACGTGGTTGATGCT
337338339340341342343344345346347348349350351352353354355356357358359360
R Q E L H F R Q L F A I V R A M G Y A R D V E L
R Q E L H F R Q L F A I V R A M - - - - - - - L
CGCCAGGAACTGCACTTCCGCCAGCTCTTCGCAATCGTGCGGGCGATG---------------------CTG
361362363364365366367368369370371372373374375376377378379380381382383384
V H V P F G V I T T P D G Q P L S T K K G N M V
V H V P F - - - - - - - - - P L S T K - - - - -
GTGCATGTCCCGTTC---------------------------CCCCTCTCGACCAAG---------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y L E A L L D D A V A R A R A L V D A K S A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P L E E R A A I A E A V G I G A V I Y N D L Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D P R R N I T L D W D R M L S I E G N S A A Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q Y S H A R C R S I L R R A A D E G V A L A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D L T L L T H P S E Q R L I R H L A R L P E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R E A G A R Y A P F V I A D W C Y T T A R E F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I F F E Q C P V L R A E T P A L R A A R L Q L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574
A A T A N A L R N G L A L L G I Q A P E R M
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_arg_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K I L V M A A P L A Q L R D R F Q A A L A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S F G P E W A A T D P L L V P A T N P K F G D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q S N V A M S L A K Q L G Q P P R A I A E T L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q N L N L A D L C E P P A I A G P G F I N F T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q P S Y L V A Q L Q Q L Q T D E R L G I Q P V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P P Q R V I V D F S S P N I A K E M H V G H L R
- - - - - I V D F S . P N I A K E M H V G H L R
---------------CAGCGCCAGCATCTT---AAAGCTAAAGATGTAGTTGCTGTTGCGGTTCTGGCTAAG
145146147148149150151152153154155156157158159160161162163164165166167168
S T I I G D S I A R V L E F Q G H E V L R L N H
S T I I G D S I A R V - - - - - - - - L R L N H
GTCAGCGTACTTCACCGCGCCAAGACCAACCGC------------------------CGGGGTTTCCGATCG
169170171172173174175176177178179180181182183184185186187188189190191192
V G D W G T Q F G M L I A F L Q E Q Y P Q A L S
V G D W G - - - - - - - - - - - - - - - - - - -
CTCTTCAGCAGCAAT---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q P D A L D I S D L V A F Y K Q A K A R F D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P S F Q E T A R Q R V V D L Q S G E A T A R Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W Q L L C D Q S R R E F Q K I Y D R L D I Q L E
- - - - - D Q S R R E F Q K I Y D R L D - - - E
---------------AACGTAGATAATCCGCTGGGCCTGATCTTGACCCAGGCGATAACG---------CAA
265266267268269270271272273274275276277278279280281282283284285286287288
E R G E S F Y N P Y L P A I V E D L R R L G L L
E R G E S F - - - - - - - - - - - - - - - - - -
ATCCGTCGTGGCGTAGTT------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V E D Q G A Q C V F L E G F Q N K E G Q P L P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I V Q K S D G G Y N Y A T T D L A A L R Y R L G
- - - - - - - - - N Y A T T D L A A L R - - - -
---------------------------GAAGCTCTCACCCCGTTCTTCGAGCTGAATATC------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q D Q A Q R I I Y V T D S G Q A N H F A Q V F Q
- - - - - - - I Y V T D S G Q A N H F A Q V F Q
---------------------CGATTGATCGCAAAGCAACTGCCATGCCTGACGCGCCGTAGCTTCACCCGA
361362363364365366367368369370371372373374375376377378379380381382383384
V A Q R A G W L P A A A Q I E H V P F G L V Q G
V A Q R A - - - - - - - - I E H V P F - - - - -
CTGCAGATCGACCAC------------------------GCTCGGGTCTTCGTCAAA---------------
385386387388389390391392393394395396397398399400401402403404405406407408
E D G K K L K T R A G D T V R L R D L L D E A V
- - - - K L K T R - - - - - - - - - - - - - - -
------------TACCAAGTCACTGAT---------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D R A R T D L T T R I A A E E R S E T P E F I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A V A Q A V G L G A V K Y A D L S Q N R N S N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I F S F D K M L A L Q G N T A P Y L L Y A Y V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I Q G I A R K G G I D F A Q L D P V A A V L T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P T E R S L A K Q V L Q L G E V L D E V A R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L P N R L C S Y L F E L S Q T F N Q F Y D R C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I L N A E E P Q R T S R L L L C D L T A R T L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590
L G L S L L G I S V L E R M
- - - - - - - - - - - - - -
------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_arg_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K I E D K L V T S V I S G L K A L Y G Q D V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A Q V Q L Q K T K K E F E G H L T L V V F P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L K M S K K G P E Q T A Q E I G E Y L K A N E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A V A A F N V I K G F L N L T V A S A T W I E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L N E I H T D A Q Y G I V S A D E N A P L V M I
- - - - - - - - - - - - - - - - - - - - - - M I
------------------------------------------------------------------ATACTG
121122123124125126127128129130131132133134135136137138139140141142143144
E Y S S P N T N K P L H L G H V R N N L L G N A
E Y S . P N T N K P L H L G H V R N N L L G N A
GATAAAAGG---TGTATTACCGTTAAAGTCGATAGACTCTTTCGGATTGAAAGTCATATTTTTACGGGCATC
145146147148149150151152153154155156157158159160161162163164165166167168
L A N I V M A N G N K V V K T N I V N D R G I H
L A N I - - - - - - - - V K T N I V N D R G - -
CACTTTCAGGAT------------------------AACGATACGTGCAATATCGTCCGCCTCTTC------
169170171172173174175176177178179180181182183184185186187188189190191192
I C K S M L A W Q K Y G K G E T P E S S G K K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D H L V G D Y Y V A F D K H Y K A E V A E L M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K G M S K E E A E A A S P L M N E A R E M L V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W E A G D P E V R A L W Q M M N N W V Y A G F D
- - - - - - - - - - - - - - - - N W V Y A G F D
------------------------------------------------ACGCAGCTTAGCCGTACCGATGTC
265266267268269270271272273274275276277278279280281282283284285286287288
E T Y R K M G V G F D K I Y Y E S N T Y L E G K
E T Y R K M . . . . D K I Y Y E S N - - - - - -
CTGAGTCATGTATACCGA------------GCGAAGCAACAGTTTGTGATCCAA------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K V M E G L E K G F F F K K E D G S V W A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T A E G L D H K L L L R G D G T S V Y M T Q D I
- - - - - - - - - - - - - - - - - V Y M T Q D I
---------------------------------------------------CTTACGGTACGTTTCATCAAA
337338339340341342343344345346347348349350351352353354355356357358359360
G T A K L R F A D Y P I D K M I Y V V G N E Q N
G T A K - - - - - - - - - - - I Y V V G N E Q N
ACCGGCGTATAC---------------------------------TTCCGGATCACCGGCTTCCCATTTCAC
361362363364365366367368369370371372373374375376377378379380381382383384
Y H F Q V L S I L L D K L G F E W G K S L V H F
Y H F Q V L S I L L D K L - - - - - - - L V H F
CAACATCTCACGCGCTTCATTCATCAACGGGGAGGCAGC---------------------GCCTTTCTCCAT
385386387388389390391392393394395396397398399400401402403404405406407408
S Y G M V E L P E G K M K S R E G T V V D A D D
S Y - - - - - - - - K M K S R - - - - - - - - -
CAGTTC------------------------ATCGAAAGCGACATA---------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L M A E M I A T A K E T S Q E L G K L D G L T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E E A D D I A R I V G L G A L K Y F I L K V D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R K N M T F N P K E S I D F N G N T G P F I Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T Y A R I R S V L R K A A E A G I V I P E V L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A N I E L S E K E E G L I Q M V A D F A A V V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Q A G E D Y S P S G I A N Y V Y D L V K E Y N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F Y H D F S I L R E E N E D V K L F R I A L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597
N I A K V V R L G M G L L G I E V P D R M
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_arg_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D T F A R F E Q A I R D A L L D T T L I P A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I D L V A P K A S G V Q A D L A L P C F R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K L R G I N P A Q F A Q T L A N A L K F T P E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V L K A S A L G A Y V N F S L N P V T F A Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V L H D I S Q R K A E Y G R S T K G Q N Q A V V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------TGA
121122123124125126127128129130131132133134135136137138139140141142143144
V D Y S S P N I A K R M R V D H I R S T M I G Q
V D Y S . P N I A K R M R V D H I R S T M I G Q
ACTATTGCCATC---GGCCAACATGCGCTCCCAATCGACCACCACATCGTGGGCTGGATCGTGCTGTAAATT
145146147148149150151152153154155156157158159160161162163164165166167168
A I V N I Y R A L G Y H V I R M N H W G D Y D P
A I V N I - - - - - - - - I R M N H W G D Y D -
GTGATAAATGACTGC------------------------TTCATTGATTTCTGTGCTCGAAAAGGGGAT---
169170171172173174175176177178179180181182183184185186187188189190191192
Q L G I S L A A M Q H F Q H R N G N G E S M L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S L E Q Q T Q Q Y H A D D Q V H D L A Q A W A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K L T K G E P Q A I K L L Q Q L V D L S L T A N
- - - - - - - - - - - - - - - - - D L S L T A N
---------------------------------------------------GCGAAAATGCAATTCTTGCGC
241242243244245246247248249250251252253254255256257258259260261262263264
Q A N Y R R L G V A F D V Q H C E S F Y A R E A
Q A N Y R R L G - - - - V Q H C E S F - - - - -
TTGCTTAACCACATAAATAATTTT------------TAGCTCCTCGCGATATTTAAT---------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q V V I K E A L H Y Q I A Q L D G H V A V V K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L L D E Q G K A L P T L L L N R S D G S S L Y I
- - - - - - - - - - - - - - - - - - - - - L Y I
---------------------------------------------------------------GATGACCAC
313314315316317318319320321322323324325326327328329330331332333334335336
T R D I A A I K Y R E E L Y Q P T K I I Y V V K
T R D I A A I K - - - - - - - - - - - I Y V V K
TTGGGCTTCGCGAGCATAAAAACT---------------------------------ACGGCGATAATTGGC
337338339340341342343344345346347348349350351352353354355356357358359360
Q A Q E L H F R Q A F T I S K T L G Y T K A D L
Q A Q E L H F R Q A F T I S K T L - - - - - - L
TTGGTTGGCAGTTAAACTCAAATCAACAAGCTGCTGTAAAAGCTTGATCGC------------------CAG
361362363364365366367368369370371372373374375376377378379380381382383384
S H V A C G M I L G P E R R S P S G A R F S T M
S H V A C - - - - - - - - - - P S G A R - - - -
TTTGCTAGCCCAAGC------------------------------ATGATATTGTTGGGT------------
385386387388389390391392393394395396397398399400401402403404405406407408
I Y L E P L L D E A C T R A K A L I K Q K A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S K I P F S S T E I N E I A E Q V G V G A V I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
H N L Q H D P A H D V V V D W E R M L A F D G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S S T Y L Q Y M H A R C C S I L R D F G R I P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N Y D G R V L T H S A E Q A L L K E L A R L P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V I V D A A E R Y A P F V V S D W L Y A T A K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F A V F Y D S C S V L K A E T L A L R A A R G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L V A A T A Q A L R N G L G L L S I A A P E R M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_arg_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P A Q K H T L E T L L E N S V K Q V V Q A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K G D A D A A F V L P A I A L E R P K V A A H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V A C N V A L Q L A K P L G A N P R Q L A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I V A A L T A Q P A A A G L V D A A E I A G P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F I N L R L T P A S K Q A V I G A V F A Q G R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F G A S E R E H G K R V L L E F V S A N P T G P
- - - - - - - - - - - - L L E F . S A N P T G P
------------------------------------TTTCAGCGCGAG---GATGTCGAACACGAACTCGGT
145146147148149150151152153154155156157158159160161162163164165166167168
L H V G H G R Q A A L G D A L A N V L A S Q G Y
L H V G H G R Q A A L G D A L A N V - - - - - -
GTCCGCCTTGCGGGAAATCAGGAAGAAGCGCACCGCGTCGCGCCCGCGCGTGAT------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A V H R E F Y Y N D A G V Q I G N L A I S T Q A
- - H R E F Y Y N D A G - - - - - - - - - - - -
------CGAGACTTCCGAGCCCGGCGTCGCGCCGCC------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R A R G L K P G D A G W P E A A Y N G E Y I A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I A R D Y L N G E T V A A S D G E P V T G K R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A D D L E A I R K F A V A Y L R R E Q D M D L K
- - - - - - - - - - - - A Y L R R E Q D M D L K
------------------------------------GCGCTCCCACTTCGTCACGTGGTACGCGACGTCCGG
265266267268269270271272273274275276277278279280281282283284285286287288
A F G V K F D Q Y Y L E S S L Y T E G R V E K T
A F . . . . D Q Y Y L E S S - - - - - - - - - -
CACGAA------------GCCGTCCGTCTTGCGCATCACACG------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V D A L I A A G M T Y E Q E G A L W L R T T D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G D D K D R V M R K T D G T Y T Y F V P D V A Y
- - - - - - - - - - - - - - - T Y F V P D V A Y
---------------------------------------------CACGCCGAACGCCTTCAGGTCCATGTC
337338339340341342343344345346347348349350351352353354355356357358359360
H V T K W E R G F T K V I N I Q G S D H H G T I
H V - - - - - - - - - - I N I Q G S D H H G T I
CTGTTC------------------------------GATCGCCTCGAGATCATCGGCGTCGCGCTTGCCCGT
361362363364365366367368369370371372373374375376377378379380381382383384
A R V R A G L Q G L H I G I P K G Y P D Y V L H
A R V R A G L Q G . . I - - - - - - P D Y V L H
CACCGGCTCGCCGTCGCTCGCCGCGAC------GCC------------------GATGTCGGCGATGTACTC
385386387388389390391392393394395396397398399400401402403404405406407408
K M V T V M R D G Q E V K I S K R A G S Y V T V
- - - - - - - - - - - - K I S K R - - - - - - -
------------------------------------GGGCTTGAGGCCGCG---------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R D L I E W S G G A T P G S E V S P E L L D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T I T R G R D A V R F F L I S R K A D T E F V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D I D L A L K Q N D E N P V Y Y V Q Y A H A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C S V L N E W K S R Y G A T D A L L P G A D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P L D S K Q A M A L M Q K L A E Y P D V L A H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A N E L A P H A V A F Y L R E L A S E F H S F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N A E R V L V D E E A P R T A R I A L L A A T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594
Q V L E N G L A M L G V S A P S K M
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_arg_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I V E Q M K D V L K Q E I K E A V M K A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A E S E I P E V V L E V P K D K S H G D Y S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N M A M Q L A R I A K K A P R N I A E E I V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F D K G K A S I D K L D I A G P G F I N F Y M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N Q Y L T K L I P A V L E A G E A Y G E T N I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G G E R V Q V E F V S A N P T G N L H L G H A R
- - - - - Q V E F . S A N P T G N L H L G H A R
---------------ATTCTCATTAGA---TGAGACGGCCAGATCAAGGTCAAAGTCCATATGGGTATCGGC
145146147148149150151152153154155156157158159160161162163164165166167168
G A A V G D S L C N V L E K A G Y E V S R E Y Y
G A A V G D S L C N V - - - - - - - - S R E Y Y
GCTGCGCATCGCAAAGAAGTAACGCACAGCGTC------------------------GCGCATTGTGACGGC
169170171172173174175176177178179180181182183184185186187188189190191192
I N D A G N Q I N N L A L S V E A R Y F Q A L G
I N D A G - - - - - - - - - - - - - - - - - - -
TTTTCCGGTTCTTTT---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K D K P M P E D G Y H G E D I K E I G R K L A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E F G D R F V H E E E S E R L A F F R E Y G L K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------CAG
241242243244245246247248249250251252253254255256257258259260261262263264
Y E L G K L R E D L E N F R V P F D V W Y S E T
Y E L G K L R E D L E N F . . . . D V W Y S E T
AAGATACGTGTAGGATCCGTCTTTTTTGATCAGCACGCG------------GCCGAACGCCGTCGAGCGGAA
265266267268269270271272273274275276277278279280281282283284285286287288
S L Y Q N G K I D Q A L E A L R E K G H I Y E E
S - - - - - - - - - - - - - - - - - - - - - - -
CCA---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D G A T W F R S T A F G D D K D R V L I K K D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S Y T Y L L P D I A Y H K D K L D R G F Q K L I
- - T Y L L P D I A Y H K - - - - - - - - - - I
------CAATTCGTACTTTAAGCCGTATTCGCGGAAAAA------------------------------AAA
337338339340341342343344345346347348349350351352353354355356357358359360
N V W G A D H H G Y I P R M K A A I E A L G Y D
N V W G A D H H G Y I P R M K A A I E A L - - -
ACGATCGCCGAATTCGTCGGCGAGCTTTTGGCCGATTTCCTTAATATCTTCGCCGTGATACCC---------
361362363364365366367368369370371372373374375376377378379380381382383384
K E T L E V E I I Q L V H L Y K N G E K M K M S
- - - L E V E I I - - - - - - - - - - - - K M S
---------ATCTTTTCCAAGCGCCTG------------------------------------GATTTGATT
385386387388389390391392393394395396397398399400401402403404405406407408
K R T G K A V T M R D L I D E V G L D A V R Y F
K R - - - - - - - - - - - - - - - - - - - - - -
GCCGGC------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F A M R S A D T H M D F D L D L A V S T S N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P V Y Y A Q Y A H A R I C S M L R Q G E E K G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S F E G N L D L T K I A S E K E Y D L L K V I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S F P E A V A D A A E K R I P H R I T N Y I F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L A S V L H S F Y N A E K V L D P A D E E K S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A R L S L M K A T Q I T L N N A L K L I G V S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556
P E K M
- - - -
------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_arg_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L V N A I R Q K V S E V I S K A Y G S E I E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V E I P P R K E F G D L S T N V A M K L A K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L K K N P R E I A Q E I V K S L D E D P S F D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I E I M G P G F I N F F L S N E L L R G V V K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V L E K K D E Y G R E N V G N G M K V Q F E Y G
- - - - - - - - - - - - - - - - - - - Q F E Y .
---------------------------------------------------------CAGTTCGAATAC---
121122123124125126127128129130131132133134135136137138139140141142143144
S A N P T G P F T V G H G R Q I I I G D V L S E
S A N P T G P F T V G H G R Q I I I G D V L S E
AGTGCAAACCCAACGGGACCATTCACCGTTGGGCACGGTAGACAGATCATCATAGGTGACGTGCTTTCCGAG
145146147148149150151152153154155156157158159160161162163164165166167168
V Y K E L G Y D V T R E M Y I N D A G K Q I R L
V - - - - - - - - T R E M Y I N D A G - - - - -
GTT------------------------ACGAGGGAAATGTATATAAACGACGCCGGA---------------
169170171172173174175176177178179180181182183184185186187188189190191192
L A Q S L W A R Y N Q L L G V E K E I P E G G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R G E Y L V D I A R D L V N E I G D R Y K D L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N E E V E E F F K Q T A L N R I L S S M K D T L
- - - - - - - - - - - - - N R I L S S M K D T L
---------------------------------------AACAGAATTCTCTCCTCCATGAAAGATACCCTT
241242243244245246247248249250251252253254255256257258259260261262263264
E K I G S S F D V Y F S E K S L I E D G T V E E
E K I . . . . D V Y F S E K S - - - - - - - - -
GAAAAGATT------------GATGTGTACTTCTCAGAAAAGAGT---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V L K L L K N K D V V Y E K D G A V W L K V S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F I D E E D K V L V R S D G T Y T Y F M T D I A
- - - - - - - - - - - - - - - - T Y F M T D I A
------------------------------------------------ACGTACTTCATGACGGATATCGCG
313314315316317318319320321322323324325326327328329330331332333334335336
Y H Y K K Y K R G F R K V Y D I W G S D H H G H
Y H Y - - - - - - - - - - Y D I W G S D H H G H
TATCACTAC------------------------------TACGACATCTGGGGTAGTGACCATCACGGTCAC
337338339340341342343344345346347348349350351352353354355356357358359360
I P R M K A A M K A L D I P D D F F N V I L H Q
I P R M K A A M K A L - - - - - - F N V I L H -
ATACCAAGAATGAAGGCAGCGATGAAAGCCCTC------------------TTCAACGTTATACTGCAT---
361362363364365366367368369370371372373374375376377378379380381382383384
F V T L K R G G E I V R M S T R A G E F V T L D
- - - - - - - - - - - R M S T R - - - - - - - -
---------------------------------CGCATGTCCACGCGA------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L L D E V G R D A T R Y F F A M V D P N T H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V F D I D L A K A K S M D N P V Y Y V Q Y A H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R I H N L F S N A E K K G V K F E E G K H L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L G N E E E R V L M R N L G M F N T A L K E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q M F A P N R L T N Y L Q S L A E S F H A F Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K H V I V D P E N P E L S N A R L N L A L A T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546
I V L R K G L K L I G V S A P E R M
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_arg_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I V G Q M K E Q L K E E I R Q A A V K A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V S A D E L P D V L L E V P R D K A H G D Y S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N I A M Q L A R I A K K P P R A I A E A I V G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L D R E R V S V A R I E V A G P G F I N F Y M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N R Y L T A V V P A I L Q A G Q A Y G E S N V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N G E K V Q V E F V S A N P T G D L H L G H A R
- - - - - Q V E F . S A N P T G D L H L G H A R
---------------CGGATTTTCATT---CTGCGACACGGCCAAGTCCATGTCAAAATCCAAATGCGTATC
145146147148149150151152153154155156157158159160161162163164165166167168
G A A V G D S L C N I L A K A G F D V T R E Y Y
G A A V G D S L C N I - - - - - - - - T R E Y Y
GCCCGAGCGCATCGCAAAGAAATAGCGGACGGC------------------------CTCGCGCATCGTCAC
169170171172173174175176177178179180181182183184185186187188189190191192
I N D A G K Q I Y N L A K S V E A R Y F Q A L G
I N D A G - - - - - - - - - - - - - - - - - - -
CGCCTTGCCGGTGCG---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V D M P L P E D G Y Y G D D I V E I G K T L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E Y G D R F V H A D E E E R L A F F R E Y G L R
- - - - - - - - - - - - - - - - - - - - - - - R
---------------------------------------------------------------------CGG
241242243244245246247248249250251252253254255256257258259260261262263264
Y E L D K I K Q D L A A F R V P F D V W Y S E T
Y E L D K I K Q D L A A F . . . . D V W Y S E T
AAGCAAGTACGTATACGTGCCGTCCTGCTTAATTAAGAC------------GTCCCCAAACGCCGTCGAACG
265266267268269270271272273274275276277278279280281282283284285286287288
S L Y E S G K I D E A L S T L R E R G Y I Y E Q
S - - - - - - - - - - - - - - - - - - - - - - -
GAA---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D G A T W F R S T A F G D D K D R V L I K Q D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T Y T Y L L P D I A Y H Q D K L R R G F T K L I
- - T Y L L P D I A Y H Q - - - - - - - - - - I
------GTCGAGCTCATAACGAAGGCCGTATTCGCGGAA------------------------------GAC
337338339340341342343344345346347348349350351352353354355356357358359360
N V W G A D H H G Y I P R M K A A I A A L G Y D
N V W G A D H H G Y I P R M K A A I A A L - - -
GAACCGATCGCCATATTCCTCAGCAAGTGTTTTGCCGATTTCGACAATGTCGTCGCCGTAATA---------
361362363364365366367368369370371372373374375376377378379380381382383384
P E A L E V E I I Q M V N L Y Q N G E R V K M S
- - - L E V E I I - - - - - - - - - - - - K M S
---------CATATCGACACCGAGCGC------------------------------------GTAAATTTG
385386387388389390391392393394395396397398399400401402403404405406407408
K R T G K A V T M R E L M E E V G V D A V R Y F
K R - - - - - - - - - - - - - - - - - - - - - -
CTTGCC------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F A M R S G D T H L D F D M D L A V S Q S N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P V Y Y V Q Y A H A R V S S I L R Q A E E Q N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S Y E G D L A L H H L V E T E K E I E L L K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G D F P D V V A E A A L K R M P H R V T A Y A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L A S A L H S F Y N A E K V L D L D N I E K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K A R L A L V K A V Q I T L K N A L A L I G V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557
A P E Q M
- - - - -
---------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_arg_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I I D Q V K Q T L V E E I A A S I N K A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A D E I P D I K I E V P K D T K N G D Y A T N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A M V L T K I A K R N P R E I A Q A I V D N L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T E K A H V K Q I D I A G P G F I N F Y L D N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y L T A I I P E A I E K G D Q F G H V N E S K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q N V L L E Y V S A N P T G D L H I G H A R N A
- - - L L E Y . S A N P T G D L H I G H A R N A
---------TTGCTTGAGTAT---TCAGCTAACCCTACAGGAGATTTACATATTGGTCATGCTAGAAATGCA
145146147148149150151152153154155156157158159160161162163164165166167168
A V G D A L A N I L T A A G Y N V T R E Y Y I N
A V G D A L A N I - - - - - - - - T R E Y Y I N
GCAGTTGGTGATGCTTTAGCTAATATT------------------------ACACGTGAATATTATATTAAT
169170171172173174175176177178179180181182183184185186187188189190191192
D A G N Q I T N L A R S I E T R F F E A L G D N
D A G - - - - - - - - - - - - - - - - - - - - -
GATGCTGGT---------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S Y S M P E D G Y N G K D I I E I G K D L A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H P E I K D Y S E E A R L K E F R K L G V E Y E
- - - - - - - - - - - - - - - - - - - - - E Y E
---------------------------------------------------------------GAATACGAA
241242243244245246247248249250251252253254255256257258259260261262263264
M A K L K N D L A E F N T H F D N W F S E T S L
M A K L K N D L A E F . . . . D N W F S E T S -
ATGGCTAAACTGAAAAATGATTTAGCAGAGTTC------------GATAATTGGTTTAGTGAAACATCT---
265266267268269270271272273274275276277278279280281282283284285286287288
Y E K G E I L E V L A K M K E L G Y T Y E A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A T W L R T T D F K D D K D R V L I K N D G T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T Y F L P D I A Y H F D K V K R G N D I L I D L
T Y F L P D I A Y H F - - - - - - - - - - I D L
ACGTATTTCTTACCAGATATTGCGTACCACTTC------------------------------ATCGATTTA
337338339340341342343344345346347348349350351352353354355356357358359360
F G A D H H G Y I N R L K A S L E T F G V D S N
F G A D H H G Y I N R L K A S L E T F - - - - -
TTTGGTGCTGATCATCATGGTTATATTAACCGTTTGAAAGCATCTCTTGAAACGTTT---------------
361362363364365366367368369370371372373374375376377378379380381382383384
R L E I Q I M Q M V R L M E N G K E V K M S K R
- L E I Q I M - - - - - - - - - - - - K M S K R
---TTAGAAATTCAAATCATG------------------------------------AAGATGAGTAAACGT
385386387388389390391392393394395396397398399400401402403404405406407408
T G N A I T L R E I M D E V G V D A A R Y F L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M R S P D S H F D F D M E L A K E Q S Q D N P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y Y A Q Y A H A R I C S I L K Q A K E Q G I E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A A A N D F T T I T N E K A I E L L K K V A D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E P T I E S A A E H R S A H R I T N Y I Q D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S H F H K F Y N A E K V L T D D I E K T K A H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A M I E A V R I T L K N A L A M V G V S A P E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553
M
-
---
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_arg_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N L L T Q L R S L F E P A L T G L A P D R A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V P D L L G A I K P A A N A D N G D Y Q A N C A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M A L G K Q L G Q K P P E V A K A L V A A L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N D L L E P P T V A G P G F I N L R L K P E F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A R A L Q E I A T D P K L G V S P A A K S K T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V I D L S G P N V A K P L H V G H L R S T I I G
V I D L . G P N V A K P L H V G H L R S T I I G
GGCGTACTTCAC---ACCGACACCAACGACCTCCGCAATTTCTTGCTTTTCAGAGGCCTCCGCTTCATAGAT
145146147148149150151152153154155156157158159160161162163164165166167168
D A L V R I L R F L G H T V I G D N H L G D W G
D A L V R I - - - - - - - - I G D N H L G D W G
CTTGTGCCCGAACGAGCG------------------------CTTCTGGAGGCTCAGCGCGGCGGCTTCATT
169170171172173174175176177178179180181182183184185186187188189190191192
T Q F G I L L Y G Y K N H R D D A A F A A D P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R E L L R L Y I F V R K Q A A L A E G E D E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G A D N P V M A A C R A E T S K L H A N D P E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V A L W K S F M P A C M E M L R P I Y E R L D V
- - - - - - - - P A C M E M L R P I Y E R L D -
------------------------CGTGAAGGCTCCGTCGCGCTTGCGGATGATCGCCGGTGGCTCCTC---
265266267268269270271272273274275276277278279280281282283284285286287288
K I D H A L G E S F Y N P M L A G V V A D M L A
- - - H A L G E S F - - - - - - - - - - - - - -
---------CTCGGGCGTTTGGGGAACGAT------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K G I A V E S K G A I V I P N A K G I V P Q T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E E Q K K E E P P A I I R K R D G A F T Y T T T
- - - - - - - - - - - - - - - - - - - T Y T T T
---------------------------------------------------------CGGCATGAAGCTCTT
337338339340341342343344345346347348349350351352353354355356357358359360
D L A T I K Y R A E T W K P D A M L Y V V G A P
D L A T I K - - - - - - - - - - - L Y V V G A P
CCAGAGCGCGACGTTTTC---------------------------------GCGGCACGCCGCCATCACCGG
361362363364365366367368369370371372373374375376377378379380381382383384
Q A L H F K T V F A Q A K R W G V D G I E F Q H
Q A L H F K T V F A Q A K R W - - - - - - F Q H
GTTGTCCGCGCCGCCCTCTTCGTCCTCGCCTTCGGCCAGAGCCGC------------------GTACAGGCG
385386387388389390391392393394395396397398399400401402403404405406407408
V Q F G S M L G A D R K I F G T R K G G A L E L
V Q F - - - - - - - - - I F G T R - - - - - - -
CAGCAGTTC---------------------------GTCGTCGCGGTGGTT---------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M E L L N E A A A L S L Q K Y E A N T A E R R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F G H K I Y E A E A S E K Q E I A E V V G V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V K Y A D L S Q N R T T D Y V F D L D K M T A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V G N T A A Y M Q Y A Y A R C R S I F R E G G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D E G V F R T A P P A V T L P H A A E R A L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
H L L R L P E A V E A A A A D Y A P H L I T A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L W D L A K A T S V F Y E G C S V L K A D T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580
L K A S
- - - -
------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_arg_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K E T L E Q L K P R F E Q A L A A A L G A E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G V D P I L V T A S N P K F G D Y Q A N V A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L A K Q V G K P P R A I A E Q I V L K L D V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F C E N P T V A G P G F I N L T L K P A Y L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A Q L Q K I N P D P R L G I A S V K H P K K V I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------ATT
121122123124125126127128129130131132133134135136137138139140141142143144
V D Y P S P N I A K E M H V G H L R P A V I G D
V D Y . S P N I A K E M H V G H L R P A V I G D
GTAGATTAT---AGCCCAAATATTGCTAAAGAAATGCACGTTGGGCATTTGCGTCCAGCTGTGATTGGAGAT
145146147148149150151152153154155156157158159160161162163164165166167168
C L S R I L E F I G H D V V R L S H V G D W G T
C L S R I - - - - - - - - V R L S H V G D W G -
TGTCTTTCTCGAATT------------------------GTGCGTCTGAGTCATGTAGGCGATTGGGGA---
169170171172173174175176177178179180181182183184185186187188189190191192
P F G M L I A Y L Q K A Y P E A L T T D E N L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L G D L S S F Y R Q A K K Q F D T D E G F K E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A R Q A V V Q L Q A G E E K T I L A W K I V C Q
- - - - - - - - - - - - - - - - - - - - - - - Q
---------------------------------------------------------------------CAA
241242243244245246247248249250251252253254255256257258259260261262263264
L S S R A Y R V I Y D L M G I A P F I E R G E S
L S S R A Y R V I Y D L M G - - - - I E R G E S
CTGTCTAGTAGAGCATATCGAGTTATTTACGATTTGATGGGA------------ATTGAAAGAGGAGAATCT
265266267268269270271272273274275276277278279280281282283284285286287288
F Y N A L L A E T I E E L E A K G L V E I D A G
F - - - - - - - - - - - - - - - - - - - - - - -
TTT---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A K C I F L E G F T N K E G K P L P L I V Q K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D G G Y N Y A T T D L A A I R Y R V N V D K A Q
- - - - N Y A T T D L A A I R - - - - - - - - -
------------AATTACGCTACAACAGATTTAGCTGCTATTCGC---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V I Y P V G A E Q T N H F A Q I F Q V G K R A
- - I Y P V G A E Q T N H F A Q I F Q V G K R A
------ATTTATCCAGTGGGTGCTGAGCAAACTAATCATTTTGCTCAAATTTTTCAGGTAGGAAAACGAGCG
361362363364365366367368369370371372373374375376377378379380381382383384
G W I T D E V E F F H A P F G L V L G E D G S K
- - - - - - - - F F H A P F - - - - - - - - - K
------------------------TTTTTTCACGCTCCTTTT---------------------------AAG
385386387388389390391392393394395396397398399400401402403404405406407408
L K T R S G E A V R L K D L L D E A I A H A R K
L K T R - - - - - - - - - - - - - - - - - - - -
TTGAAAACTCGC------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D L E S R L K E E G R E E T E E F I N H V A Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I G I S A V K Y A D L S Q N R N S N Y I F S Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K M L A L Q G N T A P Y M L Y A Y A R I Q G I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R K G G I D F E Q L G D N V K V V L Q H E T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V L A K H L L Q L D E V I S T I E E D L L P N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L C E Y L F Q L S Q K F N Q F Y D R D R G V P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L N A E E P Q R T S R L V L C N L T A R T L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589
G L S L L G I P V L E R M
- - - - - - - - - - - - -
---------------------------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_arg_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N K S V K K K I K D E I N V I V T N L A L S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N I K L D N I N I N I Q K P P K S D L G D I S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L M F E I G K T L K L P I E I I S E E I I K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K T K Y E I K A V G P Y L N I K I S R K E Y I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N T I Q M V N T Q K D T Y G T S K Y L D N K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I L E F S S P N T N K P L H V G H L R N D V I G
I L E F S . P N T N K P L H V G H L R N D V I G
GATATATGGTCCAGA---TCCCGTAAAAGACAGGCTTTCTTTTTTATTAAATACAATATCTTTATGTATAGC
145146147148149150151152153154155156157158159160161162163164165166167168
E S L S R I L K A V G A K I T K I N L I N D R G
E S L S R I - - - - - - - - T K I N L I N D R G
TGATTTTAGCAGATAATA------------------------TAAAGCATTTTTTTTAGCGCTCTCTTTATT
169170171172173174175176177178179180181182183184185186187188189190191192
V H I C K S M L A Y K K F G N G I T P E K A F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K G D H L I G D F Y V K Y N K Y S Q E N E N A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E I Q D L L L L W E Q K D V S T I E L W K K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N K W A I E G I K E T Y E I T N T S F D K I Y L
- K W A I E G I K E T Y E I T N - - - - K I Y L
---ATAAATCATTTCTTCAAAATTAAATTCTTTTGTTCTAACTGCTAT------------TTGGGTAAGATA
265266267268269270271272273274275276277278279280281282283284285286287288
E S E I F K I G K N V V L E G L E K G F C Y K R
E S E - - - - - - - - - - - - - - - - - - - - -
GATAGATGT---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E D G A I C I D L P S D S D E K A D T K V K Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L I R S N G T S I Y L T Q D L G N I A V R T K
- - - - - - - - - I Y L T Q D L G N I A - - - -
---------------------------TTCAAGGTAAATTTTATCAAATGAGGTGTTTGT------------
337338339340341342343344345346347348349350351352353354355356357358359360
E F N F E E M I Y V V G S E Q I Q H F K S L F F
- - - - - - - I Y V V G S E Q I Q H F K S L F F
---------------------CCATTTATTTAACTTTTTCCAAAGTTCAATTGTGCTTACATCTTTTTGCTC
361362363364365366367368369370371372373374375376377378379380381382383384
V A E K L G L S K N K K L I H L S H G M V N L V
V A E K L - - - - - - - L I H L S H - - - - - -
CCAGAGTAAAAGTAG---------------------ATTTTCATTTTCTTGTGA------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D G K M K S R E G N V I D A D N L I S N L I E L
- - K M K S R - - - - - - - - - - - - - - - - -
------ATCGCCAATTAAATG---------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I I P E M T Q K I E N K E S A K K N A L N I A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G A I H Y Y L L K S A I H K D I V F N K K E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S F T G N S G P Y I Q Y V G A R I N S I L E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K A L S I P V M E K I D F E L L K H E K E W E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I K I I S E L E E N I I N A A K D L N P S I L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S Y S Y S L A K H F S T Y Y Q E V K V I D T N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I N L T A A R I E F L K A I L Q T I K N C M Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585
L N I P Y M L K M
- - - - - - - - -
---------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_arg_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I D L V L R E A I Q N A F Q S V F E L S I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A D V N L Q P T R K E F E G T H T L I V F P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T T T C K V S P E V I A N K I G D W M Q T N T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I A S Y N V V K G F L N L S I K D T I W L A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F N Q M Y Q N K H F G Y L P S N R Q K I V V E Y
- - - - - - - - - - - - - - - - - - - - V V E Y
------------------------------------------------------------GTAGTTGAATAT
121122123124125126127128129130131132133134135136137138139140141142143144
S S P N T N K P L H L G H L R N N F L G H A V S
S . P N T N K P L H L G H L R N N F L G H A V S
TCT---CCTAACACTAATAAACCCTTACACCTTGGTCATTTAAGGAATAATTTTCTAGGGCATGCTGTTAGT
145146147148149150151152153154155156157158159160161162163164165166167168
E I L Q A A G Y E V Y K V N L V N D R G I H I C
E I - - - - - - - - Y K V N L V N D R G - - - -
GAAATA------------------------TATAAGGTTAACTTAGTAAATGATCGAGGT------------
169170171172173174175176177178179180181182183184185186187188189190191192
K S M V A Y Q H W G R G E T P E S R G L K G D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L V G K Y Y V K F D Q V Y K E Q V A A L T Q T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G D A E Q A A K Q A P L L Q E A Q V M L K Q W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A G N E E V L A L W R K M N G W V Y D G F D I T
- - - - - - - - - - - - - - G W V Y D G F D I T
------------------------------------------GGTTGGGTATATGATGGCTTTGATATTACC
265266267268269270271272273274275276277278279280281282283284285286287288
Y Q K L G I T F D K V Y Y E S Q T Y L L G K E V
Y Q K L . . . . D K V Y Y E S Q - - - - - - - -
TATCAAAAGTTA------------GATAAAGTATATTATGAATCTCAG------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V A E G L A K G T F Y K K Q D G S V W I D L T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E G L D E K L L L R A D G T S V Y I T Q D L G T
- - - - - - - - - - - - - - - V Y I T Q D L G T
---------------------------------------------GTATATATAACCCAAGATTTAGGGACT
337338339340341342343344345346347348349350351352353354355356357358359360
A D L R Y Q D F K P N K L V Y V V G N E Q D Y H
A D - - - - - - - - - - - V Y V V G N E Q D Y H
GCTGAC---------------------------------GTTTATGTAGTAGGTAACGAACAAGATTATCAT
361362363364365366367368369370371372373374375376377378379380381382383384
F E V L A K I M A R L G R P Y A T D L Y H L S Y
F E V L A K I M A R L - - - - - - - L Y H L S Y
TTTGAAGTGCTTGCTAAAATTATGGCTCGTTTG---------------------CTATACCACCTCTCGTAT
385386387388389390391392393394395396397398399400401402403404405406407408
G M V D L P T G K M K S R E G T V V D A D M L I
- - - - - - - - K M K S R - - - - - - - - - - -
------------------------AAAATGAAGTCCAGG---------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D E M I E T A E E H T R E L G K I D G F S K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A K D L Y H I L A M G A L K Y F L L R V D A K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R L L F D P Q A S I D F Q G D T G P F I Q Y T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A R I A A V L R K V Q Q A D I A F N D I V E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N F V L H P L E R E V I V E L A A F P K K L Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S A L A Y A P A I L A Q H V L E I A K A Y N R M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y A E L S I L H E Q D T K V Q L F R I Q L S V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596
V A Q V I K T V M H L L G I V V P E R M
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_arg_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L K A Q L K A A V E Q A A H Q M G M P V D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I Q E T P A N K P G D Y G T P A A F Q M A K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A G G N P A Q I A A Q L A Q T V V L P A G I R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E A T G P F L N F F L D A G A F V R G V V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P F E L P K R E G K V V I E H T S V N P N K E L
- - - - - - - - - - - V I E H . S V N P N K E L
---------------------------------GTCATCGAGCAC---TCGGTCAACCCCAACAAAGAGCTG
121122123124125126127128129130131132133134135136137138139140141142143144
H V G H L R N V V L G D S M A R I L R A A G H T
H V G H L R N V V L G D S M A R I - - - - - - -
CACGTCGGGCACCTGCGTAACGTGGTGCTGGGCGACTCCATGGCGCGGATT---------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V E V Q N Y I D D T G R Q A A E S L F A T Q H Y
- E V Q N Y I D D T G - - - - - - - - - - - - -
---GAGGTACAGAACTACATCGACGACACCGGG---------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G R V W D G V Q K Y D Q W L G E G Y V Q L N A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P Q K P E L E S G I M E I M H K L E A G E L R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L V E Q T V K A Q L Q T C F R L G A R Y D L L N
- - E Q T V K A Q L Q T C F R L . . . . D L L N
------GAGCAGACGGTGAAGGCGCAGCTTCAGACCTGCTTTCGCCTC------------GACCTGCTGAAC
241242243244245246247248249250251252253254255256257258259260261262263264
W E S D V V G S G F L A Q A M N I L E G S R Y T
W E S D - - - - - - - - - - - - - - - - - - - -
TGGGAATCCGAC------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S R P T E G K Y A G A F I M D V S E F M P G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E P N V V L V R S G G T A M Y A A K D I G Y Q F
- - - - - - - - - - - - - M Y A A K D I G Y Q F
---------------------------------------ATGTACGCCGCCAAGGACATCGGCTACCAGTTC
313314315316317318319320321322323324325326327328329330331332333334335336
W K F G L F E G M K F K P F M Q D P E G N T I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T S A P D G Q P D D E R R F G H A Q E V I N V I
- - - - - - - - - - - - - - - - - - - - I N V I
------------------------------------------------------------ATCAACGTGATC
361362363364365366367368369370371372373374375376377378379380381382383384
D S R Q D H P Q T V V R S A L G V A G E Q E K E
D S R Q D H P Q T V V R S A L G V A - - - - - -
GACTCGCGCCAGGACCACCCGCAGACGGTGGTGCGTTCGGCGCTGGGTGTGGCG------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E R S I H L S Y A F V T L E G Q T I S G R K G I
- - S I H L S Y - - - - - - - - T I S G R - - -
------AGCATCCACCTCTCCTAC------------------------ACCATCAGCGGGCGC---------
409410411412413414415416417418419420421422423424425426427428429430431432
A V S A D D A M D E A Q K R A L S V L Q G I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D L A A R E D A A E I A R R I G L G A I R F A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L K A E P T R K I D F R W E Q A L A L N G D T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P Y V Q Y A A V R A A N I L K K A E E A G Y A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D G T G A D W D A L P D I D L V L A K Q I A K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P E V A A Q A A R I H S P H V V A Q Y A L D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T S F N A W Y N A K T K Q G K P A T N V L Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E G L R E A R L A L I V R L R K A F E D T L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609
I G I E I P A A M
- - - - - - - - -
---------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_arg_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E D L K D I C A Q A M H T V L G D H I A P L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A Q E G W K E S M L G V F T S P L V T P T T N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K Y G H Y Q F N S T M G I A K L I K D L H Y D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L P S N P A E L S G L F T Q A M L C V Q D K Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E K G C P K P I E A V N I A G C F I N I A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P A Y L L S K C F D I Y M A V P F G T L P K P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T L P R K R V V V D F S S P N V A K S M H V G H
- - - - - - - V V D F S . P N V A K S M H V G H
---------------------GTCGTCGACTTTTCG---CCTAACGTGGCAAAGTCTATGCACGTGGGTCAC
169170171172173174175176177178179180181182183184185186187188189190191192
L R S T I I G D S I C R L Y E Y V G Y D V H R I
L R S T I I G D S I C R L - - - - - - - - H R I
CTGCGATCAACGATTATCGGGGACTCTATTTGCCGTCTC------------------------CACCGCATC
193194195196197198199200201202203204205206207208209210211212213214215216
N H V G D W G T Q F G M L I T H L T D M H P E I
N H V G D W G - - - - - - - - - - - - - - - - -
AACCACGTGGGCGACTGGGGC---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A D A A A H C R R I T M L P I D N L V A F Y K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A K E R F D N D P A F Q K R A Y E A V V K L Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L N L A E F Y L W C K I C D I S R H E F Q R I Y
- - - - - - - - - - - - - D I S R H E F Q R I Y
---------------------------------------GACATCTCTAGGCACGAGTTTCAGCGCATTTAT
289290291292293294295296297298299300301302303304305306307308309310311312
D R L D I K I D E F G E S S Y K F K L G T T V A
D R L D - - - D E F G E S S - - - - - - - - - -
GATCGCCTAGAC---------GATGAGTTTGGAGAGAGTTCC------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R L K R L H L T Q M S D K A T V I P I E G M D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P L I I V K S D G G F T Y D T T D M A A I Y H R
- - - - - - - - - - - T Y D T T D M A A I Y - -
---------------------------------ACTTACGACACAACAGACATGGCAGCTATTTAT------
361362363364365366367368369370371372373374375376377378379380381382383384
T Q V L H A D K C V Y V V D A G Q S S H F D L V
- - - - - - - - - V Y V V D A G Q S S H F D L V
---------------------------GTGTACGTTGTTGACGCCGGCCAGTCGAGTCACTTTGATCTTGTT
385386387388389390391392393394395396397398399400401402403404405406407408
F K A A E K A G W I T K D Q A V H V P F G V V L
F K A A E K A - - - - - - - A V H V P F - - - -
TTCAAAGCTGCTGAGAAGGCT---------------------GCCGTGCACGTCCCATTC------------
409410411412413414415416417418419420421422423424425426427428429430431432
G S D G K R L K T R A G E T V K L E D L L D E A
- - - - - R L K T R - - - - - - - - - - - - - -
---------------CGCCTCAAAACAAGA------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V T E S M R L L E E R N R D Q E F S Q E E M R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V A E A V G Y G A V K Y A D L S S H R I K D Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y D P K R M L N L K G N T A A Y L L Y S F T R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S S I C R K A G I D R E E L Y T S D T L R N L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I T E P S E I N L L V A L L K V R D T I L F T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E D L C P H R I C D W V Y S V A S A Y T D F Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K C R V I E T S A S G D S V C N K S R L V L C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621
M A R Q S L R L A F H L L G I R E I D R M
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_arg_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A S A A P A Q T L G Q F T S T A K R V P S V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T D L A G V F S T A L R T A F P N V D I Q P A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A A T N N R D H G D Y Q C N N A M A L F G R M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G K E G A P K N P R E V A T A I L N A L P D T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I D G T P T L A G P G F I N I K L S S A W L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E R I Q I L V K Q R A V V D F S S P N V A K E M
- - - - - - - - - - - V V D F S . P N V A K E M
---------------------------------GTGGTGGATTTCTCA---CCCAATGTGGCCAAGGAGATG
145146147148149150151152153154155156157158159160161162163164165166167168
H V G H L R S T I I G D T I A R T L E F C G V D
H V G H L R S T I I G D T I A R T - - - - - - -
CATGTGGGCCACCTGCGATCCACCATTATCGGAGACACCATCGCGCGCACG---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T L R I N H V G D W G T Q F G M L I Q H I A E T
- L R I N H V G D W G - - - - - - - - - - - - -
---CTGCGTATCAACCATGTGGGCGACTGGGGC---------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R P G G L Q G T T T E E V S D L Q T L Y K A S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A R F D A E E D F K A R A R E A V T R L Q S G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P E F L E T W K R I C E A S R N E F D A I Y H R
- - - - - - - - - - - E A S R N E F D A I Y H R
---------------------------------GAGGCCAGCCGCAACGAGTTTGACGCCATCTACCATCGA
265266267268269270271272273274275276277278279280281282283284285286287288
L D V H I L W R G E S W Y N P R L T P L V E E L
L D - - - L W R G E S W - - - - - - - - - - - -
CTGGAC---------TTGTGGCGGGGGGAGTCATGG------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I E R G I A E E S E G A K V I T V E G L K T P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M I R K S D G G Y G Y G T T D M A T L A Q R I H
- - - - - - - - - G Y G T T D M A T L A - - - -
---------------------------GGCTATGGGACCACCGACATGGCCACCCTGGCT------------
337338339340341342343344345346347348349350351352353354355356357358359360
D E K A E W L I Y V T D E G Q S G H F K L V F G
- - - - - - - I Y V T D E G Q S G H F K L V F G
---------------------ATTTATGTGACGGACGAGGGCCAGTCGGGGCACTTCAAGCTGGTGTTTGGC
361362363364365366367368369370371372373374375376377378379380381382383384
A G K R A G I I P A K N P P R I D H V G F G L V
A G K R - - - - - - - - - - - I D H V G F - - -
GCGGGCAAGCGC---------------------------------ATCGACCACGTTGGCTTC---------
385386387388389390391392393394395396397398399400401402403404405406407408
L G Q D G K R I R T R D S G A A V R L V E L L D
- - - - - - R I R T R - - - - - - - - - - - - -
------------------CGGATCCGTACCCGT---------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E A K A R C A A S I K E R Q E T T I E R G G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S A E E M E N I S S V M G Y G A V K Y A D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N N R A T N Y K F N F D E M L D L K G N T A V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M L Y A H A R I A G I I R K S N K D I K E V A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T A H I S L D H A S E R A L A L H I V R F T E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L E D T L V E L A P N R I T E Y V Y E L S N Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N T F Y V G C K V L G E K E E D S R L L L C E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596
T A M I M R Q C F Q L L G I K P L Y R I
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_arg_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M C A A A A T V N V E L A L K E I V K A T I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A F P L V P A Q E P L I T L G K V S E Y Q C N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A M G L V K V L S Q Q Q Q P I K M S P Q M V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L K K N L V G N D I I D E F E P T P K G F I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V S I R K E W V A R M V K E V L K Q G I R P P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V T K Q R V L V D F S A P N I A K E M H V G H L
- - - - - - L V D F . A P N I A K E M H V G H L
------------------CTCGTCGACTTT---GCGCCGAACATTGCCAAGGAGATGCATGTCGGACATCTG
145146147148149150151152153154155156157158159160161162163164165166167168
R S T I I G E S I S R L L E F C Q H D V A R I N
R S T I I G E S I S R L - - - - - - - - A R I N
CGCTCCACCATCATCGGCGAGTCGATCAGCCGCCTG------------------------GCACGCATCAAC
169170171172173174175176177178179180181182183184185186187188189190191192
H I G D W G T A F G M L I L Y I K R N F P D Y T
H I G D W G - - - - - - - - - - - - - - - - - -
CACATCGGCGACTGGGGT------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T N P P D I S D L T D F Y R A A K K C F D E D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E F K E K A R L E V V K L Q A L E E D S I Q A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K Y I C D V S R E E F D K V Y T R L G A T I E E
- - - - D V S R E E F D K V Y T R L G - - - E E
------------GACGTGTCGCGCGAGGAGTTCGACAAGGTTTACACCCGCCTCGGC---------GAGGAG
265266267268269270271272273274275276277278279280281282283284285286287288
R G E S F Y N P L I P K V L D L L E E A G Q I E
R G E S F - - - - - - - - - - - - - - - - - - -
CGCGGTGAGAGCTTC---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V S D G A K L I V S K E A R K L D S L D A R D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T K L A S Q H L A L V S R D G P S Y H P N L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A M K K A G I L T G T E G E E S V A L S K K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K P W N K F D I R V D L D K L M A Q L A P L Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Q L D P L F L E V F E A A G I V K G D S I L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P R F S F P L M V V K S D G G Y T Y D T T D V T
- - - - - - - - - - - - - - - - T Y D T T D V T
------------------------------------------------ACCTACGACACGACAGATGTCACG
433434435436437438439440441442443444445446447448449450451452453454455456
A T Y H R F V I E K M N R V I Y C T D L G Q Y E
A T Y - - - - - - - - - - - I Y C T D L G Q Y E
GCCACGTAC---------------------------------ATCTACTGCACCGATTTGGGCCAGTACGAG
457458459460461462463464465466467468469470471472473474475476477478479480
H F R M C M Q T A K D M G W M E H A T W D H A G
H F R M C M Q T A K D M - - - - - - - W D H A G
CACTTCCGCATGTGCATGCAGACGGCAAAGGACATG---------------------TGGGACCACGCCGGC
481482483484485486487488489490491492493494495496497498499500501502503504
F G L V T G A D G K K I K T R S G E T V K L K D
F - - - - - - - - - K I K T R - - - - - - - - -
TTT---------------------------AAGATAAAGACGCGC---------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L M D E A V E R S L A I L K E R E A G E R S Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
H S E E E M Q K L S N I I G I G A I K Y F D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q T R T G D Y A F S Y D K M L D M S G N T A V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L L Y Q Y A R I C S I K R K A G I A D E E L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I T D I S L E T P Q E K S L A L C A L R F Q T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I L K T V E D L F P H H L A D F A Y E L M T N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S N F F Q N C R V L D D P L Q N S R L C L V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692
T R I T L K K T L E L L N I E T A E R I
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_arg_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L G I A Q E L N N L L L T A M E N M F P E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I L A T D S G K P L D P Q L I I A S K P E F G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F Q V N G P L A L S K I L G K P P R K I A T D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V N A L L A I P S F S E L C S P P I I A G P G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I N L V L K P E L L K S E I R K V L S N P N I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V P N V T E T E D H L F P V I I D F S S P N I A
- - - - - - - - - - - - - - I I D F S . P N I A
------------------------------------------ATAGCTAGTGATCCG---TTGACTAAGGTC
145146147148149150151152153154155156157158159160161162163164165166167168
K D M H V G H L R S T L I G D C L A R I L E F R
K D M H V G H L R S T L I G D C L A R I - - - -
TGCATATTTTACGGCAGCTATACCAACTTTCTTTGAAACATCTTTAATAAAAATCTCTTC------------
169170171172173174175176177178179180181182183184185186187188189190191192
G Y N V L R L N H V G D W G T Q F G M L I T H L
- - - - L R L N H V G D W G - - - - - - - - - -
------------ACGTTTACGTAAATCTATATCAGCACGTTC------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K Q V A P Q A L I N P D V I E L G D L V A F Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q A K N R F D N D Q S F Q I A S R E E V V R L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S G D P D S R K A W Q L L C D Q S R R E F Q V I
- - - - - - - - - - - - - - D Q S R R E F Q V I
------------------------------------------TTCAAAAATTACCCCAAATCTATAACGAAT
265266267268269270271272273274275276277278279280281282283284285286287288
Y D R L D I T I T E R G E S F Y N S Y L E E V I
Y D R L D - - - T E R G E S F - - - - - - - - -
GGCAGCAAGATCCGT---------ATTGAAGCCACCATCACTCTT---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L D L D A L D L L V T D E G A R C V F L E G V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G K S N K P L P V I I Q K S D G G F N Y A T T D
- - - - - - - - - - - - - - - - - - N Y A T T D
------------------------------------------------------AGTAATAGTAATATCGAG
337338339340341342343344345346347348349350351352353354355356357358359360
L A A I R Y R F G V I F E G D G A S R I V Y V T
L A A I R - - - - - - - - - - - - - - - V Y V T
ACGATCATAAATTAC---------------------------------------------ACGTGAATCAGG
361362363364365366367368369370371372373374375376377378379380381382383384
D S G Q A N H F A G I F Q I A R R A G W V P T N
D S G Q A N H F A G I F Q I A R R A - - - - - -
ATCACCACTTTGCAGTCTTACCACTTCTTCTCGAGAAGCTATCTGGAAAGATTG------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G R L E H V P F G L V Q G Q D G K K L K T R A G
- - L E H V P F - - - - - - - - - K L K T R - -
------TTGTCTATAAAATGCAAC---------------------------ATTGATCAGTGCCTG------
409410411412413414415416417418419420421422423424425426427428429430431432
D T V R L K D L L D E A I E R A D I D L R K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A E E N R S E E E I F I K D V S K K V G I A A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K Y A D L S Q N R I T S Y Q F N F D R M L S L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G N T A P Y L L Y A M V R I A G I L R K S S K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H D T L E K Q L H F S E P I E W A L V R H I L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F D L I I I E V E E E L L P S R L C S Y L F E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S Q L F N R F Y D Q V P V L K A K E P N L S S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L I L C Q L T A D T L K M G L N L L G I P T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602
R M
- -
------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_arg_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_arg_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F L D K I L E D V V E E I E K L K I L T K E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R T C L T I T N V S G K P H C T L F L P K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L Q N L D I N D L Y S H F K T A K F L L I K D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T T F K S S I S F N I N L I P Y S Y E I L T T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E K G E D F G R N N I G N G E T V V I D Y S S
- - - - - - - - - - - - - - - - - - V I D Y S .
------------------------------------------------------GTAATTGATTACAGT---
121122123124125126127128129130131132133134135136137138139140141142143144
P N I A K I F H M G H F R T T I L G N F V K K I
P N I A K I F H M G H F R T T I L G N F V K K I
CCAAATATTGCGAAAATCTTTCATATGGGACACTTTCGAACTACAATTTTAGGAAATTTTGTAAAAAAAATT
145146147148149150151152153154155156157158159160161162163164165166167168
H A F C G Y K A V G I N Y L G D W G K Q F G L V
- - - - - - - - V G I N Y L G D W G - - - - - -
------------------------GTTGGTATTAATTATCTCGGTGACTGGGGT------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L G S Q R F S N P E E L K T D P I K Y L F N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y V Q I S Q A K A T D P S V D V E A K K I F E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M E K G T D S S L L D K W S H F R E L S I N K Y
- - - - - - - - - - - - - - - - - E L S I N K Y
---------------------------------------------------GAATTAAGCATTAACAAATAC
241242243244245246247248249250251252253254255256257258259260261262263264
K E L Y S K L G V E F E E Y S G E S F Y E K T C
K E L Y S K L . . E - - E Y S G E S F - - - - -
AAAGAGTTATACAGCAAATTG------GAA------GAATATTCTGGAGAAAGTTTT---------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q D D I K K C N F L I K N S D G S V C L D L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K N P L V I K S D G T S L Y L T R D F S A A K
- - - - - - - - - - - - - L Y L T R D F S A A K
---------------------------------------CTTTATCTAACTAGAGATTTTTCTGCTGCTAAA
313314315316317318319320321322323324325326327328329330331332333334335336
D R I A R Y N P K K L I Y V V S S E Q K E H F E
- - - - - - - - - - - I Y V V S S E Q K E H F E
---------------------------------ATTTATGTTGTTTCAAGCGAACAGAAAGAACATTTTGAA
337338339340341342343344345346347348349350351352353354355356357358359360
D L F A T L R K A E I F D N L E H V Q Y G M V S
D L F A T L R K A - - - - - L E H V Q Y - - - -
GATTTATTTGCTACTTTACGTAAAGCG---------------TTAGAACATGTACAATAT------------
361362363364365366367368369370371372373374375376377378379380381382383384
G M S T R K G T V K F L E D I I D I A T D V M M
G M S T R - - - - - - - - - - - - - - - - - - -
GGAATGTCTACACGT---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Q I D A N P E K K A Q I K D V S A T A L N L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V S T L I I M D F S A K R I K G Y K F D V E K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A M N T K G T G I Y I Q Y A H C R L K S I E D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N K D I D L N K D I K I D S K C L E Q E E I L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L L Y Q F I W F E K V V I S S F K D N E P N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F T Y V S N L C W L T N S Y N S S L K V K G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P S V A K T R L Q V L K C A R L I I G T T L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561
F G L T P L N K M
- - - - - - - - -
---------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_cys_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G V R I Y N T A T R Q V E E F V T Y V P K L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R G Y V C G I T P Y D H V H V G H G R V Y V F F
R G Y V . G I T P Y D H V H V G H G R V Y V F F
CGCGGCTATGTA---GGCATAACGCCATACGACCACGTCCACGTAGGCCACGGGAGGGTGTACGTCTTTTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D M F R R Y L E A R G Y E V R L V I N F T D I D
D M F R R Y - - - - - - - - R L V I N F T D I D
GACATGTTTAGGCGCTAC------------------------CGATTAGTGATAAACTTTACGGATATAGAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I I N K A R E E F G H D A Y K R W K E V P E
- - - - - - - - - - - - - - - - - - - - - - - E
---------------------------------------------------------------------GAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Y I A E F F E M S N K L F I K P A H A Y P R V
R Y I A E F F E M S N K L . . . . . H A Y P R V
AGATATATAGCAGAATTCTTCGAAATGTCCAATAAGCTC---------------CATGCATATCCCAGAGTT
121122123124125126127128129130131132133134135136137138139140141142143144
T E N V N E M V A W I S T L V E K G Y A Y V A P
T E - - - - - - - - - - - - - - - - - - - - - -
ACAGAG------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D G S V Y F E V G K V P N Y G V L S R Q K I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I A G A R V E P E P G K K N P L D F A L W K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W T P G E P W W N S P W C P G R P G W H L E C V
- - - - - - - - - - - - - - - - - G W H L E C V
---------------------------------------------------GGGTGGCATTTAGAGTGCGTC
217218219220221222223224225226227228229230231232233234235236237238239240
V M S T K Y L G A P F D F H G G G A D L I F P H
V M S T - - - - - - - - F H G G G A D L I F P H
GTAATGTCGACG------------------------TTCCACGGCGGTGGGGCGGATTTGATATTCCCCCAC
241242243244245246247248249250251252253254255256257258259260261262263264
H E N E I A I A K A Y Y G L D N F A K Y W I H V
. E N E I A I A K A Y - - - - - - A . Y W I H V
---GAGAACGAAATTGCAATAGCCAAGGCGTAT------------------GCA---TACTGGATACACGTG
265266267268269270271272273274275276277278279280281282283284285286287288
G Y L T V R G E K M S K S L G N V I T L R E V L
- - - - - - - - K M S K S - - - - - - - - - - -
------------------------AAAATGTCCAAGTCT---------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S K Y S G E A L R L A Y A M S H Y R K P M E F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F E L L D Q A E E M V K T L Y T A Y D E L S Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V A D A S D E D K E K L E Y G K Y I E S F Y A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L E D D F S T P Q A A Q Q L Y G L A R Y I I S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V L H R I D K A S R Q T A I D V L T Q Y V K M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D I L G V L E R R E I P K E V E E V I K A V V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R A R L R R E K M Y Q L A D Y L R E R L A G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474
G V E L H D F G Q R T Y Y T Y K R R
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_cys_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Q S F S M I K W S G K P T I R V R N T M G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R L E E F K P L K P G I V R M Y V C G P T V Y D
- - - - - - - - - - - - - R M Y V . G P T V Y D
---------------------------------------CGCATGTACGTA---GGTCCTACAGTTTACGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y T H I G H A R T Y V A F D A I K R Y L V L R G
Y T H I G H A R T Y V A F D A I K R Y - - - - -
TACACACACATTGGGCACGCGAGAACATATGTGGCCTTCGATGCCATAAAACGGTAT---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y H V I H V Q N I T D I D D K I I N R A Q R E N
- - - I H V Q N I T D I D - - - - - - - - - - -
---------ATACACGTGCAGAACATAACAGACATAGAT---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D W R E I V D E Y S R D Y F D M L K K L N I K
- - - - - - - D E Y S R D Y F D M L K K L . . .
---------------------GACGAGTATAGCCGCGACTACTTCGACATGCTGAAGAAGCTC---------
121122123124125126127128129130131132133134135136137138139140141142143144
V H I H P R V T E H I K E I I D F I Q G L I D K
. H I H P R V T E - - - - - - - - - - - - - - -
---CACATACACCCGCGCGTAACAGAA---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G Y A Y V A P S G S V Y F N V D A Y P E Y G S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S G R F H P E D W R Q E E D V L R E K K N P Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F A L W K A W K P G E P Y W E A P W G R G R P G
- - - - - - - - - - - - - - - - - - - - - - - G
---------------------------------------------------------------------GGC
217218219220221222223224225226227228229230231232233234235236237238239240
W H I E C S V M S S R Y L G E Q F D I H G G G Q
W H I E C S V M S S - - - - - - - - I H G G G Q
TGGCACATAGAGTGCAGCGTGATGTCTTCG------------------------ATTCACGGCGGAGGCCAG
241242243244245246247248249250251252253254255256257258259260261262263264
D L I F P H H E N E K A Q S E A Y F S K K P W V
D L I F P H . E N E K A Q S E A Y - - - - - - V
GACCTAATATTTCCACAT---GAGAACGAAAAGGCACAGAGCGAGGCCTAC------------------GTC
265266267268269270271272273274275276277278279280281282283284285286287288
K Y W L H T G Y L T I R G E K M S K S L G N I I
. Y W L H T - - - - - - - - K M S K S - - - - -
---TACTGGCTCCATACC------------------------AAAATGAGCAAAAGC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
P F R E A A K K W N P S V L R M W L L S A H Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T Q L D F S E E S L A Q A E A N L R R I R G T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E L A R M L E R A T P E G R I S D D E L K A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E D T S H A Y L E F H E A M S N D F N T A A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A S I L K L T R L V N S T I I P G E Y Y T A G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A L R L Y E E F N S V F S V I D D V L Y G S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A P G G E T V E K L I E L I V S V R Q E L R K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R I Y D I A D S I R S E L S Q L G I R L Y D H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489
G G K T T W R I E
- - - - - - - - -
---------------------------
Class I
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_cys_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L R I Y N T L T K Q K E E F K P I N E G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R M Y V C G P T V Y D Y P H L G H A R T Y I A F
R M Y V . G P T V Y D Y P H L G H A R T Y I A F
TTCTCTAATTTT---TGCAAGCTCAAACTTCCTCTCCTTTCTAAGCTCGGCCCTAACTTGAATTAAAAGCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V I R R Y L E H K G Y S V L M V M N F T D I D
D V I R R Y - - - - - - - - L M V M N F T D I D
TATAAGCTTCTCTTCTTC------------------------TTCCTCAAAGATCCCGAAAATTTCTCCAAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I I R R A K E T G E D P A K L A E K F I K V
- - - - - - - - - - - - - - - - - - E K F I K V
------------------------------------------------------TTCCGTTATATATTTGTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F L E D M K A L K V K P A D I Y P R V T E H I E
F L E D M K A L . . . . . D I Y P R V T E - - -
TATTGCATTGCTAACCTCAAATAC---------------CGCTGTATTAAAATCATCATCCAT---------
121122123124125126127128129130131132133134135136137138139140141142143144
D I I Q F I E R L K E K G Y A Y E G S D G V Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E V Q K F K E Y G K L S G V K L E E L R K G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V E P G E G K K N P E D F A L W K K A K P G E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K W E S P W G E G R P G W H I E C S V M S S K Y
- - - - - - - - - - - G W H I E C S V M S S - -
---------------------------------GAAATTACCCAAGCTCTTACTCATCTTCTCCCC------
217218219220221222223224225226227228229230231232233234235236237238239240
L G E S F D I H G G G N D L I F P H H E N E I A
- - - - - - I H G G G N D L I F P H . E N E I A
------------------AAGCCAATAATGGACCCATTCGTGACCAAAGCAGGC---GCTCTGGGCTATCTC
241242243244245246247248249250251252253254255256257258259260261262263264
Q S E A C F G H E W V H Y W L H T G F V M V K G
Q S E A C - - - - - V . Y W L H T - - - - - - -
ATTCTCATGGTGAGG---------------TCC---ACCATGTATATCAAA---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E K M S K S L G N F V T V R E L L Q R Y S P E V
- K M S K S - - - - - - - - - - - - - - - - - -
---CATAACTGAACACTC------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R F F V L Q K H Y R S P L D Y S E E G L Q H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K N N L E R L Y N T L E N I R I A M E N A E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y T W D E N D F K A Y N S I K E A R R K F Y E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
M D D D F N T A E A L K A V F E V S N A I N K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I T E A E K P K E S V L R K A W E F F R T V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I F G I F E E Y F K E E K A K E E E K L I E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I Q V R A E L R K E R K F E L A D K I R E E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476
K L G I Q L E D K G K E T I W K R I K V
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_cys_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G Q R L E V F E P L E P G I V R M Y V C G P T
- - - - - - - - - - - - - - - - R M Y V . G P T
------------------------------------------------GTCGTAGAGCCT---CCCCAGCCG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V Y D Y T H L G H A R T Y V A F D A I K R Y L A
V Y D Y T H L G H A R T Y V A F D A I K R Y - -
CGCTAGCTCCGATCTTATGGAGTCTGCCAGGTCGAATAGCCTTCTCTTCCTCAGCTCCTGGCGCAC------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L R G Y S V I H V Q N I T D I D D K I I D R A R
- - - - - - I H V Q N I T D I D - - - - - - - -
------------------CTCAGTCATCTCTGCCGCCGGCGCCCCGGC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R E G R D W R E I V D T Y S R D Y F E M L Q K L
- - - - - - - - - - D T Y S R D Y F E M L Q K L
------------------------------GCGGAGGGCGAGAAGCCCTGCCGTGTAGTACTCGCCGGGTAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I S V H I H P R V T D H I K E I I E F I Q G L
. . . . H I H P R V T D - - - - - - - - - - - -
------------GGTTATCCTGGTCAGCTTTAGGAC------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I D K G Y A Y V A P S G S V Y F D V D A F P G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G E L S G R F H P E E W R Q E E D V L R E K K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P Y D F A L W K A W K P G E P Y W E A P W G R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R P G W H I E C S V M S S K Y L G E Q F D I H G
- - G W H I E C S V M S S - - - - - - - - I H G
------GCTCGGGCTCCACTTCTTCGAGGCCTCCCGGAA------------------------GCTCATCTT
217218219220221222223224225226227228229230231232233234235236237238239240
G G Q D L V F P H H E N E R A Q S E A F F G K K
G G Q D L V F P H . E N E R A Q S E A F - - - -
CTCCCCGCGTATGGTTAGGTAGCCCGT---GAGCCAGTAGCGTACCCAGGGCTTCTTCCC------------
241242243244245246247248249250251252253254255256257258259260261262263264
P W V R Y W L H T G Y L T I R G E K M S K S L G
- - V . Y W L H T - - - - - - - - K M S K S - -
------GGC---CTCGTTCTCGTGGTG------------------------GCCGTGGATATCGAA------
265266267268269270271272273274275276277278279280281282283284285286287288
N I I P F R E A S K K W S P S V L R L W L L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H Y R T Q L D F S E G A L E Q A E A N L R R L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G A V S D L A R M L R E A E P R G R L S D K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K A L G E V V D A Y Y G F H E A M S D D F N T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A L A A V L K L T R I T N S T L I P G E Y Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A G L L A L R V Y E E F N T V F A V L D D V L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G A G A P A A E M T E K L V E I I V S V R Q E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R K R R L F D L A D S I R S E L A R L G I R L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472
D H P G G K T T W R I E R M G D
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_cys_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E G S S K T L R L Y N T L T R S I E P I Y P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E R N R L R L Y A C G P T V Y T Y A H I G N F R
- - - - - R L Y A . G P T V Y T Y A H I G N F R
---------------CGGCTGTATGCC---GGGCCCACGGTCTACACGTACGCCCACATCGGCAACTTTCGA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S F L T A D L I V R V A Q A L G W Q T V Y V C N
S F L T A D L I V R V - - - - - - - - V Y V C .
AGCTTTCTGACGGCCGACCTGATCGTACGCGTG------------------------GTCTACGTCTGC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I T D V G H L T V D D Y A D A S G E D K L E R A
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L R S E E G R R F P N I W D L A R Y Y T Q A F L
. . . . . . . . . . . I W D L A R Y Y T Q A F L
---------------------------------ATCTGGGACCTGGCCCGCTATTACACGCAGGCCTTTCTG
121122123124125126127128129130131132133134135136137138139140141142143144
E D W Q A L K L I E P D V R P R A T E H I R Q Q
E D W Q A L . . . . . D V R P R A T E - - - - -
GAGGACTGGCAGGCGCTC---------------GACGTCCGCCCCCGGGCCACCGAG---------------
145146147148149150151152153154155156157158159160161162163164165166167168
I L A I E Q L V K T G H A Y E T R Q G V Y F H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P S F P D Y G K L S G N R D P E Q L A R A V R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V V Q D P E K R D P R D F A L W K K D E K H L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q W Y S P W G W G F P G W H I E C S V M S M E Y
- - - - - - - - - - - G W H I E C S V M S M - -
---------------------------------GGCTGGCACATCGAATGCTCGGTCATGTCCATG------
241242243244245246247248249250251252253254255256257258259260261262263264
L G E T F D L H L G G E D L I F P H H E C E I A
- - - - - - L H L G G E D L I F P H . E C E I A
------------------CTGCACCTGGGCGGCGAAGACCTGATCTTTCCCCAT---GAATGCGAGATTGCG
265266267268269270271272273274275276277278279280281282283284285286287288
Q A E S L T G K P L A R Y W V H T R F L L V E G
Q A E S L - - - - - A . Y W V H T - - - - - - -
CAGGCCGAAAGCCTC---------------GCC---TACTGGGTGCATACC---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K M S K S K G N F F T V R E L I L P P E A G G
- K M S K S - - - - - - - - - - - - - - - - - -
---AAGATGTCCAAGTCG------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q G I D P M A L R Y A L I S G K Y R E P L N F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R K H L A D S V R I V R R Y Q E A A Q R V E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L Q G D R S G P D R L G D R L S T I Y D G T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A L C D D L N T P V A L A T A L E G V K L I L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F G D Q L N R A S A E S A Q R W L Q Q I D A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G F V Y P P K R P C S H L R P E T D P F V E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E R L L A E R D A A R R A R D F A R A D A I R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q L L Q M G I E V M D T P E G T R W R R K V L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_cys_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R L Y N T L G R R I E T F E S F D P L T V K M
- - - - - - - - - - - - - - - - - - - - - - K M
------------------------------------------------------------------AAAATG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y V C G P T V Y D Y V H I G H G R A F V G F D G
Y V . G P T V Y D Y V H I G H G R A F V G F D G
TATGTT---GGTCCTACGGTTTATGACTATGTTCATATAGGTCATGGTAGAGCATTTGTGGGTTTCGATGGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I V R Y L K L R G F N V I R V Q N I T D I D D K
I V R Y - - - - - - - - I R V Q N I T D I D - -
ATAGTGAGATAC------------------------ATAAGAGTTCAAAACATTACCGATATAGAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I I K R A N E T G K D W R E I V D Y Y T K D Y M
- - - - - - - - - - - - - - - - D Y Y T K D Y M
------------------------------------------------GATTATTACACAAAGGACTACATG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E S L K A L K V E I D Q H P R V T S H I Q E I I
E S L K A L . . . . D Q H P R V T S - - - - - -
GAGTCGCTTAAAGCTTTG------------GATCAACATCCTAGAGTAACCAGT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D F V Q K L V D K G H A Y T T S S G S V Y F D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D S F P S Y G L L S G S K K E E W N Q G E E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K E K K N P Y D F A L W K A W K P G E P Y W E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P W G K G R P G W H I E C S T M S T R Y L G E Q
- - - - - - - G W H I E C S T M S T - - - - - -
---------------------GGCTGGCATATTGAATGCTCCACAATGTCAACT------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F D I H G G G V D L V F P H H E N E R A Q S E A
- - I H G G G V D L V F P H . E N E R A Q S E A
------ATCCACGGTGGAGGTGTGGATCTAGTCTTTCCTCAC---GAGAATGAAAGGGCACAGAGTGAGGCT
241242243244245246247248249250251252253254255256257258259260261262263264
L L G K T W V K Y W V H V A Y L T I N K E K M S
L - - - - - V . Y W V H V - - - - - - - - K M S
CTA---------------GTT---TACTGGGTTCATGTA------------------------AAGATGAGT
265266267268269270271272273274275276277278279280281282283284285286287288
K S L G N I I P L N E A L K K W G P S V L R F W
K S - - - - - - - - - - - - - - - - - - - - - -
AAGTCG------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y L S T K Y R N S I D Y S E Q T L E Q A R S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q R L K D A M G I I R S V I K E E P K S H S N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E E I S T Q R E I I S L I G K F H E A M S N D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D T A T A L S N I Y E I A N L V F T K I Q Y T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D F M G A M L A F G A F R Q F N Y V F G V M D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E F N P S Y E V M Y K V I D S V V E I R N I L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A M K M Y D L S D E I R S V L A N A G I K I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466
G K E K S T W R F E
- - - - - - - - - -
------------------------------
Class I
Archaea/Staphylothermus marinus/Smarinus_cys_aa
Archaea/Staphylothermus marinus/Smarinus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y G I K I Y N T L T R K I E E F K P V S P G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V K M Y V C G P T V Y D Y N H I G H G R V Y V V
- K M Y V . G P T V Y D Y N H I G H G R V Y V V
---TATACGGTCAGC---ATCATATAGTTTTCTTTCACGAAGCTCCCTTCTAATATCTACAACTATATTGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y D A L K R Y L A L R G Y H V L H V M N I T D I
Y D A L K R Y - - - - - - - - L H V M N I T D I
CACATTATCTAGGAGGGTTTC------------------------ATATTTATCTAGAACTCCCAGTACTGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D D K I I N R A H Q E K R D W R E I A E T Y T R
D - - - - - - - - - - - - - - - - - - E T Y T R
ATT------------------------------------------------------TTGTATCTCCTTAAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D Y L E S L G K L N V K V D L H P R V T E H I K
D Y L E S L G K L . . . . D L H P R V T E - - -
CACTAGAGTCATAAACTCGCTTATCAC------------CGGTGTGTTGAAATCATTCGATAA---------
121122123124125126127128129130131132133134135136137138139140141142143144
E I I E F I Q I L I D K G Y A Y V A P S G S V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F E V D K Y P E Y G E L S G R T N K E L W S Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K E F I S E K K K P Y D F A L W K A W K P G E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H W D A P W G K G R P G W H I E C S V M S S R Y
- - - - - - - - - - - G W H I E C S V M S S - -
---------------------------------AATGTTTCCCAAGCTCTTACTCATCTTCTCACT------
217218219220221222223224225226227228229230231232233234235236237238239240
L G R Q F D I H G G G T D L I F P H H E N E R A
- - - - - - I H G G G T D L I F P H . E N E R A
------------------AACCCAGTACTTCACCCAAGGCTTCACACCAAATGC---TTCACTTTGTGCTCT
241242243244245246247248249250251252253254255256257258259260261262263264
Q S E A A F G V K P W V K Y W V H T G M V M M G
Q S E A A - - - - - - V . Y W V H T - - - - - -
CTCATTCTCATGGTG------------------TCC---ACCATGAATATCGAA------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S E K M S K S L G N I I P L R E A F K E W G P E
- - K M S K S - - - - - - - - - - - - - - - - -
------CATAACGCTACATTC---------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T L R L W Y L T S H Y R R P L V F T E E S I R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A Q K Y Y E R L V S V T N T I K K L S R E A V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L H R M N D E D L K I L E K L L E I R S R F H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A L S N D F N T P Q A L A V I S E F M T L V F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I Q Y N P K Y M L V L T A Y K L L R E F N T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L G V L D K Y L V E T P E E L E T L L D N V I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I V V D I R R E L R E R K L Y D L A D R I R S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477
L G K H G I I L M D R G K E T T W M R R K
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_cys_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R F Y N T L T R D V D E F K E M N S G R I N M
- - - - - - - - - - - - - - - - - - - - - - N M
------------------------------------------------------------------TATTCG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F V C G P T V Q D H F H I G H A R T Y I F F D A
F V . G P T V Q D H F H I G H A R T Y I F F D A
ATCAGC---CTGGAATTTCCTCTCTGTCCTGAGATTCTTTCTCAGATCCAATAGATCATCTATTATGCCGGA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V A K L L R N L G Y S V F Y L Q N I T D I D D K
V A K L - - - - - - - - F Y L Q N I T D I D - -
GAGGCGGGCAGT------------------------GCTGTCAACCCATCTGAAAACATCAATCGC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I I N K A R E M N I Q P Q D V A D M Y L R E F L
- - - - - - - - - - - - - - - - D M Y L R E F L
------------------------------------------------AAAATCGATAAGGTCTCTGAATAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E D M S A L K V T S V N Y F A K S T L Y I N E I
E D M S A L . . . . . N Y F A K S T L - - - - -
CGACCTGAAATCGAAGTC---------------CACCATTCTTTTGATAACGGCAGA---------------
121122123124125126127128129130131132133134135136137138139140141142143144
I S Q I S R L I E K G Y A Y E T S D G V Y F E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S K F A D Y G Q L S N Q S L D Q I I H G Y R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V N E N K R N P E D F V L W K K R K P G E P Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D S P W G P G R P G W H I E D T A I T E T Y F G
- - - - - - - - - G W H I E D T A I T E - - - -
---------------------------GTAATGCGATAGGTATTTTCTACCACTTATGGC------------
217218219220221222223224225226227228229230231232233234235236237238239240
P E Y D I H G G G S D L I F P H H E A E I A Q M
- - - - I H G G G S D L I F P H . E A E I A Q M
------------GTGATGCGGGAAGATCAGATCCGATCCTCCGCCATG---GTCGTATTCTGGCCCGAAATA
241242243244245246247248249250251252253254255256257258259260261262263264
R A I S G R K Y L S H Y W I H T G M I N V N N E
R A I - - - - - - S . Y W I H T - - - - - - - -
TGTCTCTGT------------------ATG---GCCAGGCCTTCCCGG------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K M S K S L K N F V T I R E V L K E Y R P E D L
K M S K S - - - - - - - - - - - - - - - - - - -
TTCTCCTGGCTTTCT---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R Y A L L N A N Y R T Q L D F S K G L L E E S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K Q V E Y L N S T F R K L V N A S G N S D L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D P S A V I K R M V D E A T N D F D F R S V F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L I D F A G D L N K N I E S I S R P A A Q K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D V F R W V D S F A G I L L P E T A R L S G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I D D L L D L R K N L R T E R K F Q E A D R I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452
D L L L K N G I H V E D R G D E T I W W
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/cys_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E V Y N T L S R K I E K L E D I V D G K R V K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M Y V C G I T A Y D Y S H I G H A R S A V F F D
M Y V . G I T A Y D Y S H I G H A R S A V F F D
ATGTACGTT---GGTATCACAGCTTACGATTACTCCCACATCGGCCACGCGAGGAGTGCCGTGTTTTTCGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F R R Y L E Y L G Y E V V Y V Q N F T D V D D
V F R R Y - - - - - - - - V Y V Q N F T D V D -
GTTTTCAGGAGGTAT------------------------GTATATGTTCAGAACTTCACGGATGTGGAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I I N R A V K E G K T Q K E V A E K F I E E Y
- - - - - - - - - - - - - - - - - E K F I E E Y
---------------------------------------------------GAAAAGTTCATTGAGGAATAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K D M E A L N V K K P T Y Q P K V T E H I P D
L K D M E A L . . . . . T Y Q P K V T E - - - -
CTGAAGGACATGGAGGCTTTA---------------ACGTATCAGCCTAAGGTTACGGAG------------
121122123124125126127128129130131132133134135136137138139140141142143144
I I E F I Q N L I E K G Y A Y V I D G D V Y F H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V P A F E H Y G E L S K Q S L E E L N R H R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P D E R K R D V K D F A L W K S A K E A D L K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q A V F D S P W G R G R P G W H I E C S V M S A
- - - - - - - - - - - - - G W H I E C S V M S A
---------------------------------------GGGTGGCACATAGAGTGCAGCGTCATGTCGGCC
217218219220221222223224225226227228229230231232233234235236237238239240
K Y L G V P F D I H G G G K D L I F P H H E N E
- - - - - - - - I H G G G K D L I F P H . E N E
------------------------ATCCACGGCGGGGGGAAGGACTTGATATTCCCCCAC---GAAAACGAG
241242243244245246247248249250251252253254255256257258259260261262263264
R A Q S F A R F G V E P V K I W V H N D F I R I
R A Q S F A R - - - - - V . I W V H N - - - - -
AGGGCTCAGAGCTTTGCGAGA---------------GTT---ATCTGGGTGCACAAC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G E K M S K S L G N I V R I R D V L Q R Y E G
- - - K M S K S - - - - - - - - - - - - - - - -
---------AAGATGAGCAAAAGC------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E V L R Y F L L T A H Y R S P L D Y T E E A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R A K R A Y E Y L R S A L I N L D M E I A Y L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T F G D R K E G K Q V D V E D Y I R R F E E A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N R D L H T P D A I A V L H E F A G L I N K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y E L S L N Q A E E L Y E A F K R L C G V L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F E K M E R V P A L S R E D A E K V V E R E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R K E R N F E L A D A I R D E F A K R G I R L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467
D T P K G T R W R V E
- - - - - - - - - - -
---------------------------------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_cys_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L Y V S N T L S G E R E P F E P L D P D S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L V Y T C G L T V S D D A H L G H A R L W V Q S
L V Y T . G L T V S D D A H L G H A R L W V Q S
TTCGTCCGCTCG---GTAGTTTCCGGCGGTCCGCTCCTCCTCGCGGACCTCCAGGACCAGTTCCACCAGGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V V V R W L A K A G Y D V R H V Q N F T D V N
D V V V R W - - - - - - - - R H V Q N F T D V N
GTCCGCCAGCGTGACGTC------------------------GCGGAAGCCGAGGACGTCGCCACCGAATTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E K I V A R T G E D D L G D S E A A V A R H Y I
- - - - - - - - - - - - - - - - - - - - R H Y I
------------------------------------------------------------GTGCCGGTTCAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E S V I E D M R A L N L D R S E V Y P R V S E H
E S V I E D M R A L . . . . . E V Y P R V S E -
TGCGGTGGCGAGTTCGAGCAGTGCGCTCAC---------------GAAGTCGTCGTTCATCGCGGCGGT---
121122123124125126127128129130131132133134135136137138139140141142143144
V P E I I D L V E T L I E E G Y A Y E T D G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y F D V T T F E D Y G K L S G Q K V D E V E P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G P E H E Q R E K R H P A D F A L W K A G G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P A D A N E H R D E S L P P L D H E S G Q T W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S P W G E G R P G W H I E C S A M S M T H L D D
- - - - - - - - G W H I E C S A M S M - - - - -
------------------------GAACGGTTCGCCGGCGGCCGCCTCGCTCTGGGC---------------
241242243244245246247248249250251252253254255256257258259260261262263264
H I D V H V G G Q D L V F P H H E N E I A Q S E
- - - V H V G G Q D L V F P H . E N E I A Q S E
---------GACGAGGTCCTGACCGCCGACGTGGACGTCGATGTG---GTCGAGGTGGGTCATGCTCATCGC
265266267268269270271272273274275276277278279280281282283284285286287288
A A A G E P F A K Y W L H V R L L E T E D E K M
A A - - - - - A . Y W L H V - - - - - - - - K M
GGAGCA---------------TGG---GCCCTCGCCCCAGGG------------------------GTGGTC
289290291292293294295296297298299300301302303304305306307308309310311312
S S S L G N Y F T V K D A V A E F G A D V V R M
S S S - - - - - - - - - - - - - - - - - - - - -
CAGCGGCGG---------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F L V S T S Y T Q R Q T F S E A T V S E A E E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W E R L E R A Y D R A V E A A D S P D A Y A T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V D E D L R A A V E S A R E S F T A A M N D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N S R A A V S A L L E L A T A V N R H A D A A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S F D Y R G L V D A V E T F E E F G G D V L G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R F G D A D E G G D V T L A D D L V E L V L E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R E E E R T A G N Y E R A D E L R D H L E T L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494
V T V E D T D D G V S F R R
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_cys_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q L Y S T L S R M V E P F Q T L Y P D R V S L
- - - - - - - - - - - - - - - - - - - - - - S L
------------------------------------------------------------------CATATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F V C G P T V Y N Y P H L G H A R T Y V V F D V
F V . G P T V Y N Y P H L G H A R T Y V V F D V
AGCGAT---GAACTGTTTTGAGGCACGTAATTCTGCCCTGATATCCTGAAGGATACTGAGCGGAGCACTGGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L A K Y L R W T G Q E V L Y I Q N I T D V D D K
L A K Y - - - - - - - - L Y I Q N I T D V D - -
TTCGGGGAGGAA------------------------TTCAATTAACGCTTCGAGATCACCATGTGC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I I N R A Q E E K I S Q K D L A R K F E R E Y I
- - - - - - - - - - - - - - - - R K F E R E Y I
------------------------------------------------AGCTGCGATAAATGCATCCCGTCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D M L S L G I D S V S Y H A R A T T H I P E I
K D M L S L . . . S - - Y H A R A T T - - - - -
TTCAGGATAGGGACCATT---------TGC------ACGGATGTGTTCCAGGGCTTT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
I N Q I E R L V G I G V G Y I T E T G V Y F N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D S F P R N G E L S G Q S K D K R I S R V T D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K K H N P A D F V L W K R G E Y G E Y T W D S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W G R G R P G W H I E D T A I T E K Y F G Q Q Y
- - - - - - G W H I E D T A I T E - - - - - - -
------------------GATAAGATCCAGCCCGCCGCCATGGATATCATA---------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D I H G G G L D L I F P H H E A E I A Q M E S L
- I H G G G L D L I F P H . E A E I A Q M E S L
---AATGGCAGTATCCTCAATATGCCAGCCCGGACGGCC---TCCCCACGGAGAGTCCCAGGTATATTCACC
241242243244245246247248249250251252253254255256257258259260261262263264
E G K H P M V R Y W M H T G F L T V E G E K M S
- - - - - - V . Y W M H T - - - - - - - - K M S
------------------TAA---AAAATCTGCAGGATT------------------------GCTGATTCG
265266267268269270271272273274275276277278279280281282283284285286287288
K S L G N F I K I Q D A L K T W D K D I I R Y F
K S - - - - - - - - - - - - - - - - - - - - - -
TTTATC------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I L L S H Y R S P L Q V S E E G L L N A K K A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E H I R A I A I T D N G P Y P E G R D A F I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M E S D L N T P N A I A A I H A L A A H G D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A L I E Y G E I L G I R F L P E T S A P L S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q D I R A E L R A S K Q F E I A D M I R K K I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423
D A G I Q V T D P P L K P L K
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_cys_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L Y L Y N T L T S R K E A F I P L E E P F V K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M Y T C G V T P Y D K A H V G H L R T Y L V T D
M Y T . G V T P Y D K A H V G H L R T Y L V T D
ATGTATACC---GGGGTTACTCCTTATGATAAAGCACATGTGGGACATTTAAGAACTTATTTAGTTACGGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L R R I L R F L G Y Y D I A V T N F T D I D D
L L R R I - - - - - - - - I A V T N F T D I D -
TTGTTAAGAAGAATA------------------------ATAGCAGTAACCAATTTTACAGATATAGAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I I K K S Q E L N K D W K E I V E E N I K Y V
- - - - - - - - - - - - - - - - - E E N I K Y V
---------------------------------------------------GAAGAAAACATTAAATATGTG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F D V L K E L K V L P F Y V Y P R V T Y H I D D
F D V L K E L . . . . . Y V Y P R V T Y - - - -
TTCGATGTTCTAAAAGAACTA---------------TACGTTTATCCAAGGGTTACTTAC------------
121122123124125126127128129130131132133134135136137138139140141142143144
I A N A V K S L L D R G Y A Y K G K Y S I Y F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V D K Y P Y Y G Q L S G I K S K K E W E Q E K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L E D K K N P Y D F A L W K F K Q P G E P Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N T I V G E G R P G W H I E C S V M S S K Y L G
- - - - - - - - - G W H I E C S V M S S - - - -
---------------------------GGTTGGCATATAGAATGTTCTGTTATGTCTTCC------------
217218219220221222223224225226227228229230231232233234235236237238239240
E R F D I H L G G S D L I F P H H E N E I A Q S
- - - - I H L G G S D L I F P H . E N E I A Q S
------------ATCCATTTGGGGGGAAGTGATTTGATATTTCCACAT---GAAAATGAAATAGCGCAAAGC
241242243244245246247248249250251252253254255256257258259260261262263264
E T L Y N V H P W V R Y W V H I G M V Q I N G E
E T L - - - - - - V . Y W V H I - - - - - - - -
GAAACCTTA------------------GTT---TATTGGGTCCATATT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K M S K S L G N I I E A K E F I K K Y K P E F V
K M S K S - - - - - - - - - - - - - - - - - - -
AAAATGTCTAAAAGT---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F F L L S T H Y R K P L D I S E E N I E Q A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T I Y K K L T D A Y N T A K S I V E N E V S Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F D K D V R I I L D Y Y R E M I K A F L D D M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T P T A I A S L N K I V S I F N Q N P E Y P I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y L T L R A F E D F N R I M N V W F E K P I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D I I N E I I E I R N M L R R E K Q Y E L A D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I R D I L Q K K G I K I K D Y K D K T V W Y A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457
I
-
---
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_cys_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L S L Y N T L T R Q K Q R F E P L Q A G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S L Y C C G V T V Y D Y C H L G H A R S Y I V W
S L Y C . G V T V Y D Y C H L G H A R S Y I V W
GCGAATCCGATC---TTCCGCAAAATCTTTGGCTTGACGAGCTGCATGACGCTTGGCAATCCAGTCTTCGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D T L R R Y L L W L G Y R V R Y V Q N F T D I D
D T L R R Y - - - - - - - - R Y V Q N F T D I D
CGCGGCTTCATCGAGTTC------------------------AGCTTCTAGGCCCAGCACACCGGCGAGCTG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I L R R S R Q E G T T M Q A I A D R Y T Q A
- - - - - - - - - - - - - - - - - - D R Y T Q A
------------------------------------------------------TTCGTGGATCAGGAGGTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y F E D M A R L N I L E A D D Y P R A T H T L D
Y F E D M A R L . . . . . D D Y P R A T H - - -
TTGCTGGCGGCGCAATTCCTTGGC---------------AGCGAGGGCAGCAGGCGTATTGAG---------
121122123124125126127128129130131132133134135136137138139140141142143144
G I Q R L I A E L E D K G F A Y A A D G D V Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S V R R F Q D Y G K L S G R K L E D L K A G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G R V E S A E E S L K H D P F D F A L W K A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P E E P A W D S P W G P G R P G W H I E C S A M
- - - - - - - - - - - - - - - G W H I E C S A M
---------------------------------------------GGACATTTTTTCGCCGCCAACATTGAC
217218219220221222223224225226227228229230231232233234235236237238239240
V R D R L G D S I D I H V G G A D L V F P H H E
V R - - - - - - - - I H V G G A D L V F P H . E
CATGCC------------------------GGGGTGGCCGGTGACGGCTTCCGATTGGGCTATCTC---TTC
241242243244245246247248249250251252253254255256257258259260261262263264
N E I A Q S E A V T G H P L A R Y W L H N G M V
N E I A Q S E A V - - - - - A . Y W L H N - - -
ATGGTGCGGAAACACGAGATCAGCACC---------------AAT---GTCCCCAAGGCGATC---------
265266267268269270271272273274275276277278279280281282283284285286287288
N V G G E K M S K S L G N F T T I R Q L L D E G
- - - - - K M S K S - - - - - - - - - - - - - -
---------------ATGCCAGCCCGGACG------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G I S P M V L R L F V L Q A N Y R K P I D F T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A L Q A C Q N G W E T L Q E G L H F G E H W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D R L G W T E S V T V D P D L S D R F R M A M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D D L N T P A A L A V L F E L A K E L R R Q Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L I H E G H L D G D A Q Q L H Q H W V T L V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A G V L G L E A E P E L A E T N E L D E A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D W I A K R H A A R Q A K D F A E A D R I R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478
Y L A D L G I T L I D Q A G G I T R W S R T
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_cys_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I T N T L T G K K E E F V P I Q P G V V R M
- - - - - - - - - - - - - - - - - - - - - - R M
------------------------------------------------------------------AGGATG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y V C G P T V Y D L I H V G N A R P A L V F D V
Y V . G P T V Y D L I H V G N A R P A L V F D V
TACGTG---GGACCCACCGTGTACGATCTCATCCACGTGGGGAACGCGAGACCCGCGTTGGTATTCGATGTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F R R Y L E Y R G Y R V I M V Q N F T D I D D K
F R R Y - - - - - - - - I M V Q N F T D I D - -
TTCAGGAGGTAC------------------------ATAATGGTTCAGAATTTCACGGATATAGAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I I N K A N Q L G V D Y K T V A D T F I A E Y W
- - - - - - - - - - - - - - - - D T F I A E Y W
------------------------------------------------GATACCTTCATAGCCGAGTACTGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D A H A L G I R P A N F H P R T T D F V E D I
R D A H A L . . . . . N F H P R T T D - - - - -
AGAGACGCACATGCGCTT---------------AATTTTCATCCAAGAACCACCGAT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E I I E K L V E K G F A Y Q T E T G V Y F D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R K F E K Y G E L S K K K I E D L I A G A R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V D E T K K S P L D F S L W K K A K P G E P C W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K S P W G E G R P G W H I E C T V M S V K I L G
- - - - - - - - - G W H I E C T V M S V - - - -
---------------------------GGTTGGCACATAGAGTGTACGGTTATGTCCGTG------------
217218219220221222223224225226227228229230231232233234235236237238239240
E S F D I H A G G E D L V F P H H E N E K A Q A
- - - - I H A G G E D L V F P H . E N E K A Q A
------------ATACACGCGGGTGGAGAAGATCTCGTGTTTCCGCAC---GAGAACGAGAAGGCTCAGGCC
241242243244245246247248249250251252253254255256257258259260261262263264
E A L T G K V F A R Y W M H N G M V R F L G D K
E A L - - - - - A . Y W M H N - - - - - - - - K
GAAGCCCTG---------------GCG---TACTGGATGCACAAC------------------------AAG
265266267268269270271272273274275276277278279280281282283284285286287288
M S K S T G N I F T V R E A V K R Y G R D G L R
M S K S - - - - - - - - - - - - - - - - - - - -
ATGAGTAAATCG------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y M I L S K H Y R S P M D F S E E L L Q D Y S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A V K R V W E I L G R Y E K S G D I G I P K R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V Y E E Y V N R F V E A L D D D F N T P V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S L I F E L A R N L S K A M D D N D R E D A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y Y H L I R R E F G P V L G L F D L N E E K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V S S E E L L K L L I E V R D V L R K E K R Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S D R I R D R L R E I G I I L K D T P S G T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460
Y T V E
- - - -
------------
Class I
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_cys_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G L V I Y D T L A R R K V P F E P A V P G H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G I Y V C G P T V Y A D P H L G H A R G P V V Y
G I Y V . G P T V Y A D P H L G H A R G P V V Y
CCGGATGAGGTC---TTTTTCGTAGTCCTTGGCCCGCCTCGCCTCTTCCCTAAGCTCCAGGAGGAGGGCGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V L R R Y L L H K G Y K V R F V S N I T D V G
D V L R R Y - - - - - - - - R F V S N I T D V .
GAGGCCCTCGAGGAGGGG------------------------CCTCTCGGGAAAGAGGCCGAGGATCCC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L T D D A D E G E D K I V R R A K L E R L E P
. . . . . . . E - - - - - - - - - - - - - - - -
---------------------CTC------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M E V A E K Y T W S Y F D A M Q A L N V L R P S
- - - - E K Y T W S Y F D A M Q A L . . . . . S
------------GGCGAAGAGGGCGGCCAGGGCCTCGGGAGTGGAGAGGTCGTC---------------GAA
121122123124125126127128129130131132133134135136137138139140141142143144
I A P R A S G H I P E M L E L T E R L L A R G V
I A P R A S G - - - - - - - - - - - - - - - - -
GGCCTTTTCCAGGGCGTCCAG---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A Y E R K G S V Y F R V R S F P E Y G K L S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R L E E L R A G A R V E V R E E K E D P L D F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L W K A A E P G H I M R W K S P W G E G Y P G W
- - - - - - - - - - - - - - - - - - - - - - G W
------------------------------------------------------------------GTGGTG
217218219220221222223224225226227228229230231232233234235236237238239240
H I E C T A M S L K Y L G E G F D L H A G G I D
H I E C T A M S L - - - - - - - - L H A G G I D
CATCCAGTGCCGGGCGAAGCGGAAGCC------------------------GCACTCGTGGTGGGGAAACTG
241242243244245246247248249250251252253254255256257258259260261262263264
L Q F P H H E C E I A Q A E A A G F R F A R H W
L Q F P H . E C E I A Q A E A A - - - - A . H W
CAGGTCAATCCCCCC---GTGGAGGTCAAAGCCTTCCCCCAGGTACTT------------CGT---CTCAAT
265266267268269270271272273274275276277278279280281282283284285286287288
M H H N H V L L E G E K M A K S T G N L V L L H
M H H - - - - - - - - K M A K S - - - - - - - -
GTGCCAGCC------------------------CTTCCAGCGCATGAT------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D L L E A H E P M A L R F Y L L Q T H Y R S P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D F T W E G L E S A K R G Y G R L L H A Y R E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R G R K K T A P P G T T P E L E R A L D A L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F M E A I E D D L S T P E A L A A L F A F L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L H K L L P E A K A E S L A R A E A V F H T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G E G I L G L F P E R V L E E R V S G P L L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L I A L L L E L R E E A R R A K D Y E K S D L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R E R L R A L G V I V E D T K E G P R W R L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_cys_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E H Q L T I Y N T L D R K K E L F V P L H A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H V G M Y V C G P T V Y G D A H L G H A R P A I
- - G M Y V . G P T V Y G D A H L G H A R P A I
------CAAGTCACTGGT---CCAGTCTTTGTTGGCTTTTGCCTTCACACGTTGTTCCAGCAACATATCGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T F D V L F R Y L T R L G Y K V R Y V R N I T D
T F D V L F R Y - - - - - - - - R Y V R N I T D
CACTTTTCCATAAGCGGCTTCACG------------------------TTTCAGACCCAGGATATCGAAGCA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V G H L E H D A D E G E D K I A K K A R L E Q L
V . . . E - - - - - - - - - - - - - - - - - - -
GAA---------TAC---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E P M E V V Q Y Y L N R Y H K A M E A L N V L P
- - - - - - Q Y Y L N R Y H K A M E A L . . . .
------------------GTCAAAGAGATGTGAAATCACAATCGGAGTATTCAGGTCATC------------
121122123124125126127128129130131132133134135136137138139140141142143144
P S I E P H A S G H I I E Q I E L V K K I L D A
. S I E P H A S G - - - - - - - - - - - - - - -
---ACACTTCGTGCGCAAGCTTTTTAC---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G Y A Y E S Q G S V Y F D V A K Y N K D Y H Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K L S G R N L D D V L N T T R E L D G Q E E K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N P A D F A L W K R A Q P E H I M R W P S P W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D G F P G W H A E C T A M G R K Y L G E H F D I
- - - - G W H A E C T A M G R - - - - - - - - I
------------CATCCAATAGTGAACCATATCGTCACCCTGTGA------------------------TTC
241242243244245246247248249250251252253254255256257258259260261262263264
H G G G M D L I F P H H E C E I A Q S V A S Q G
H G G G M D L I F P H . E C E I A Q S V A S - -
GTGGTGCGGGAAGATAAGGTCCATGCCTCCTCC---AATGTCGAAGTGTTCGCCCAGATACTTACG------
265266267268269270271272273274275276277278279280281282283284285286287288
D D M V H Y W M H N N M I T I N G T K M G K S L
- - - V . Y W M H N - - - - - - - - K M G K S -
---------CTC---ATGCCAGCCGGGGAA------------------------GCGCATGATATGTTC---
289290291292293294295296297298299300301302303304305306307308309310311312
G N F I T L D E F F S G S H K L L T Q A Y S P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T I R F F I L Q A H Y R S P V D F S N E A L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A E K G L S R L M E A V D S L E K I T P A A T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N V D V K S L R T K C F E A M N D D L N T P I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I S H L F D G A K M I N N I I A G N N T I S A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D L K D L K E V F H T F C F D I L G L K E E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S S D G R E A A Y G K V V D M L L E Q R V K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A N K D W A T S D L I R N E L T A L G F E I K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491
T K D G F E W K L N K
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_cys_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E S L R I Y N T L A R D K Q D F V P R Q P G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V R M Y V C G I T V Y D Y C H I G H A R M V V V
- R M Y V . G I T V Y D Y C H I G H A R M V V V
---CGGATGTACGTC---GGGATCACCGTCTACGACTATTGCCATATCGGCCATGCGCGGATGGTGGTCGTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F D I V Q R W L R A A G Y R V T Y V R N I T D I
F D I V Q R W - - - - - - - - T Y V R N I T D I
TTCGACATCGTCCAGCGCTGG------------------------ACGTACGTGCGCAACATCACCGACATC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D D K I I R R A L E N G E T I Q S L T R R F I D
D - - - - - - - - - - - - - - - - - - R R F I D
GAC------------------------------------------------------CGCCGCTTCATCGAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A M N A D F D A L G V E R P D I E P R A T D F I
A M N A D F D A L . . . . . D I E P R A T D - -
GCGATGAACGCGGATTTCGACGCGCTC---------------GACATCGAGCCGCGCGCGACCGAT------
121122123124125126127128129130131132133134135136137138139140141142143144
P Q M L G M I E K L E A N G Y A Y Q A K D G D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N Y S V R K F A N Y G K L S G K S L E D L R A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E R V A A K D A K D D P L D F V L W K R A K P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E P A G A S W E S K Y G A G R P G W H I E C S A
- - - - - - - - - - - - - - - - G W H I E C S A
------------------------------------------------GGCTGGCACATCGAATGCTCTGCG
217218219220221222223224225226227228229230231232233234235236237238239240
M G C T L L G E H F D I H G G G Q D L Q F P H H
M G C - - - - - - - - I H G G G Q D L Q F P H .
ATGGGCTGC------------------------ATTCACGGCGGCGGCCAGGACCTGCAGTTCCCGCAT---
241242243244245246247248249250251252253254255256257258259260261262263264
E N E I A Q S E G A T G Q T F V N Y W M H N G F
E N E I A Q S E G A - - - - - V . Y W M H N - -
GAGAACGAGATCGCGCAGAGCGAGGGTGCG---------------GTC---TATTGGATGCACAAC------
265266267268269270271272273274275276277278279280281282283284285286287288
V Q V D S E K M S K S L G N F F T I R E V L E K
- - - - - - K M S K S - - - - - - - - - - - - -
------------------AAGATGTCGAAGTCG---------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y D A E V V R F F I V R T H Y R S P L N Y S D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H L D D A R A S L T R L Y T A L K D V T P D A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P L D W S E A H A Q R F A A A M N D D F N T A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A V A V L F E L A T E V N R T R E P A L A R Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K R L A G L L G L L G R E P R E F L Q Q A A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A R T G A L E P D E I E A R I A A R V A A K Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K N Y A E A D R I R A E L L E A G I A L E D K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465
G G S T E W R R V
- - - - - - - - -
---------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_cys_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R L L D S V T K E K I K L D K K D I S I Y L C
- - - - - - - - - - - - - - - - - - - S I Y L .
---------------------------------------------------------AGTATTTATTTA---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G P T V Y D D A H L G H A R S S V C F D L L R R
G P T V Y D D A H L G H A R S S V C F D L L R R
GGACCTACGGTTTATGATGATGCACATTTAGGACATGCAAGAAGTAGTGTTTGTTTTGATCTTTTGCGTAGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L L A Q G N R V K F A R N Y T D I D D K I L K
V - - - - - - - - K F A R N Y T D I D - - - - -
GTT------------------------AAATTTGCTAGAAATTATACAGATATTGAT---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K M A Q S G Q T L E E I T E F Y I K S Y E E D M
- - - - - - - - - - - - - E F Y I K S Y E E D M
---------------------------------------GAATTTTATATCAAAAGTTATGAAGAGGATATG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R V L N V L D P D F K P R A T H Y I T A M L D L
R V L . . . D - - F K P R A T H - - - - - - - -
AGGGTTTTA---------GAT------TTTAAACCTCGTGCAACGCAT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I K K L A K D G F V Y T L E D G I Y F D T S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K Y L S L S N R N L E E N I S R L S N E V Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R N E S D F V L W K F D E N F Y E S E F G K G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P G W H T E C V A M I D S I F E N T L D I H A G
- G W H T E C V A M I D - - - - - - - - I H A G
---GGTTGGCATACTGAATGTGTTGCTATGATTGAT------------------------ATACATGCTGGA
217218219220221222223224225226227228229230231232233234235236237238239240
G I D L L F P H H E N E A A Q C R C G C K R K L
G I D L L F P H . E N E A A Q C R C G - - - - -
GGGATAGATTTGCTTTTTCCTCAT---GAAAATGAAGCTGCGCAATGTCGTTGTGGA---------------
241242243244245246247248249250251252253254255256257258259260261262263264
A N I W L H N G F V K I D G E K M S K S L N N S
A . I W L H N - - - - - - - - K M S K S - - - -
GCA---ATTTGGCTTCACAAT------------------------AAAATGAGTAAAAGT------------
265266267268269270271272273274275276277278279280281282283284285286287288
F F I K D A L K E F M G E A L R F Y L L S S H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R S H F N Y S L S D L E N A K K R L D K F Y R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K K R L D L G E I S D F D V L N D I G I K S E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A K Q I L E I L N D D L N V S K A L A L L D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I S S A N L E L D K E S K N K I L K Q N I K E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L S E L A K I F G F G F M D A T L Y F Q W G V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K E E R E E I E K L I L E R T E A K K N K D F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T A D A I R E Q L N S K K I T L L D T P N G T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462
W E K I N A
- - - - - -
------------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_cys_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L T I Y N T L T R H Q E P F E T V E P G K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K M Y Y C G V T V Y D Y C H L G H A R A C I I W
K M Y Y . G V T V Y D Y C H L G H A R A C I I W
GATGCGGTCTGA---GGCAAAATTTTTTGCTTTTCTAGCAGCTTGCCTTTGTTCGAGCATAGCTTCAATTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V V R R Y L Q F L G Y E V T Y I Q N F T D I D
D V V R R Y - - - - - - - - T Y I Q N F T D I D
TGGATCGCTTAAACCGTC------------------------TGTGACGGTAAATCCTAAAACCTCAGCTAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I L N R A R Q E N S S M E A V A E R Y I Q A
- - - - - - - - - - - - - - - - - - E R Y I Q A
------------------------------------------------------GCCCTGATGTACCAATAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y F E D M T R L N V K E A D A Y P R A T H T M N
Y F E D M T R L . . . . . D A Y P R A T H - - -
ATTGCCTTCTCGCGCCAATTCTTT---------------CACAGCCAATCCATTCGGGAAGTT---------
121122123124125126127128129130131132133134135136137138139140141142143144
G I Q R L I F E L E Q K G Y A Y P A D G D V Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A V K Q F P E Y G K L S G R K L E D L Q A G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G R V D A E D P E G R K K Q E P F D F A L W K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A K P G E P A W E S P W G A G R P G W H I E C S
- - - - - - - - - - - - - - - - - G W H I E C S
---------------------------------------------------GTTGCCCAGGGATTTAGACAT
217218219220221222223224225226227228229230231232233234235236237238239240
A M V R D R L G D T I D I H A G G A D L I F P H
A M V R - - - - - - - - I H A G G A D L I F P H
TTTTTCCCCGTT------------------------CCAGTAGTGAGAGAGGGATTTGCCTGTAACAGCTTC
241242243244245246247248249250251252253254255256257258259260261262263264
H E N E I A Q S E A V T G K S L S H Y W M H N G
. E N E I A Q S E A V - - - - - S . Y W M H N -
---TTGGGCGATTTCATTTTCGTGGTGGGGGAA---------------CCC---ATGAATGTCGATCGT---
265266267268269270271272273274275276277278279280281282283284285286287288
M V K V N G E K M S K S L G N F I T I R E L L D
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------TGCCGAACATTCAAT------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R P T D P M A V R L F V L Q A H Y R K P I D F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D E A I A A A T N G W H T L R E G L L F G H Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G K Q L E F G I R N S E F G I E D N F I P E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q R F K E A V N D D F N F P N G L A V L Q P L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K E L A R E G N L L V H Q G K T E T P P E E L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R Q W H T L V T L A E V L G F T V T I E A E T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T H D G L S D P E I E A M L E Q R Q A A R K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N F A E S D R I R D E L Q A R G I T V I D S R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487
G T R W H R N
- - - - - - -
---------------------
Class I
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_cys_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L R I Y N T L S G K V E E F V P I N P P K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I Y T C G V T V Y D D S H V G H G R S L I V F
L I Y T . G V T V Y D D S H V G H G R S L I V F
TTTGTCCCTTAT---GTCTGCAACTTTAAACACCTTTTCCTTTCTGGCTATATTTCTGGCTTCTATGAGTAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V F R R F L E H L G Y Q V K F V R N F T D V D
D V F R R F - - - - - - - - K F V R N F T D V D
CTGTATTAATTTCTCGTC------------------------CCTTTCAACCACTCTCTCAACCTTGCACTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I I N R A K Q E C T D F M T I A D R Y I A R
- - - - - - - - - - - - - - - - - - D R Y I A R
------------------------------------------------------TTTTGACGCAAACTCGTA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y Y V D M E N I R V R P A D V E P R V T E H I P
Y Y V D M E N I . . . . . D V E P R V T E - - -
TGCGGAGAGTTCCCTGTCCGTTAT---------------AGCCTTGTTCTTTACCTTGTTCAG---------
121122123124125126127128129130131132133134135136137138139140141142143144
E I I E V I Q K L V E K G Y A Y V V E G D V Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S V K K F K D Y G K L S K R D I E E L I A G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V E P S E K K R D P L D F A L W K A S K A G E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A W D S P W G K G R P G W H T E C V A M V F K H
- - - - - - - - - - - G W H T E C V A M V F - -
---------------------------------AACCAGGAGTCTCAACACATCTGGGTGATACTT------
217218219220221222223224225226227228229230231232233234235236237238239240
L G E T I D I H G G G L D L V F P H H E N E I A
- - - - - - I H G G G L D L V F P H . E N E I A
------------------GTAATTTCCGAGGGATTTTGACATTTTCTGACCGCC---GGTAACGAGTCCGTT
241242243244245246247248249250251252253254255256257258259260261262263264
Q A E A I T G K P F A R Y W M H N G L V T V G G
Q A E A I - - - - - A . Y W M H N - - - - - - -
GTGCATCCAGTATCT---------------CGT---CGCTTCCGCCTGAGC---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q K M S K S L G N Y V T L R E V Y T K Y H P D V
- K M S K S - - - - - - - - - - - - - - - - - -
---CACGAGGTCAAGTCC------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R L L V L F T H Y R S P L D F S W E K M E E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L K A Y E R L K N A I E D L E L L K K L Q V V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S K E G G T H P L Y E Q V K E F E E N F Y A S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S D D F N T P E A L S H V Y K L V G E L N K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N K A Y S E G K I T D R E L S A Y E F A S K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L N T M K K I F G L L E D L Y P E C K V E R V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E R E L E A G Q V F D E K L I Q I L I E A R N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A R K E K V F K V A D Y I R D K L K E L G I V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495
E D T P A G T K W K K R E G A
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_cys_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P P N A V S S T S A L P R P F P L P E R G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V F L F S L R G H A M T Q P T I T Q D T A R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N P N I T L Y D T M Q R Q K V P F V P G T P G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V G M Y L C G P T V Y S D A H L G H A K K E V A
- G M Y L . G P T V Y S D A H L G H A K K E V A
---GCCGAGGCTGCG---GGCGTCGCGCGCGCGCTCCAGGGTATCGCGTCCCACTGGCCCGGCATTGAGCGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F D V I R R A L T H F G Y Q V R Y V S N I T D V
F D V I R R A - - - - - - - - R Y V S N I T D V
GGTGTTCAGCTCGCCGGTCAG------------------------GGGCGTATTGAAGTCGTCGCGCATGGC
121122123124125126127128129130131132133134135136137138139140141142143144
G H L L N D A D E G E D K L Q A R A R L E Q L E
. . . . . . . . E - - - - - - - - - - - - - - -
------------------------GGC---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P M E V A D K Y F W S F F R D M D A L N V L R P
- - - - - D K Y F W S F F R D M D A L . . . . .
---------------TTCGTGCAGCGTTTCGCTGAGGCGGCGGTAGCCGTTCGCCGC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S I N P R A T G H I Q E Q I K L I E E L I E K G
S I N P R A T G - - - - - - - - - - - - - - - -
CTCGTTCATCTCGGTCACGCTGCG------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H A Y E S A G S V Y F D V R S W P E Y G K L S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R K L D D Q E E G T R E A V R D E K R D P R D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A L W K K A E P E H L M R W D S P W S V G F P G
- - - - - - - - - - - - - - - - - - - - - - - G
---------------------------------------------------------------------CGA
265266267268269270271272273274275276277278279280281282283284285286287288
W H I E C S A M S L K Y L G E G F D I H G G G L
W H I E C S A M S L - - - - - - - - I H G G G L
GCATTCGATGTGCCAGCCGGGAAACCCCAC------------------------CAGGTGCTCGGGCTCGGC
289290291292293294295296297298299300301302303304305306307308309310311312
D L Q F P H H E A E I A Q A E A A G H H F A R Y
D L Q F P H . E A E I A Q A E A A - - - - A . Y
CTTCTTCCACAGCGCGAA---GCGGGGGTCGCGTTTCTCGTCGCGCACGGC------------TTC---CTG
313314315316317318319320321322323324325326327328329330331332333334335336
W M H N N M L T I G G E K M S K S K G N F T T I
W M H N - - - - - - - - K M S K S - - - - - - -
GTCGTCGAGTTT------------------------GGGCCAACTCCGAAC---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q D I L K K Y D P M V V R F L L V S S H Y R S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T E M N E E A F A S A A N G Y R R L S E T L H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I E R R L K D A P A G S D T A L D S K I A A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T E F E D A M R D D F N T P K A V A S L F G L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G E L N T A L N A G P V G R D T L E R A R D A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R S L G G D V L G L F A E T G S A A S V A Q D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A S V I D A L M D L V L K A R Q N Y R L Q K Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A E A D E L R E T L G K A G I T V E D T K D G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532
R W K R
- - - -
------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_cys_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V K P R F H N T L T R K L D P L V P I V E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V S M Y S C G P T V Y D F A H I G N F R T F L F
- S M Y S . G P T V - - F A H I G N F R T F L F
---GCGGGCGGCGTC---GGCGGCGTAGTC------GGCCCGGGCGGCGTCGATCGACCTGGCGAGGCCCGA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A D V L R R F L E A V G L R V H H V M N L T D V
A D V L R R F - - - - - - - - H H V M N L T D V
CGCCCAGGCGAGGTCGCGGGC------------------------CAGGACGCCGTCCATCAGCGCGAGCAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G H M T E D A S V D G G G Q D K M A A A G E R L
G - - - - - - - - - - - - - - - - - - - - - - -
GCC---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L A A K K A G Q A H A A E V E D P H D P H Q V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A F Y I A A F K E D A A K L G L R V V A D G D Q
A F Y I A A F K E D A A K L . . . . . . D G . .
GGCGTCGGCCATCGGCAGCGTGGCCGCGAAGTGGCGGAGCTT------------------GTCCCG------
145146147148149150151152153154155156157158159160161162163164165166167168
N L P R A T E N V E A M L E L I G R L L G R G H
. L P R A T E - - - - - - - - - - - - - - - - -
---GGCCGTGAAGTCGGTCTG---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A Y V A E D G A A Y F R V S S F P A Y G A L S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N A L E D L R G G A G G R V T A G H Q A A K E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P A D F L L W K P D A T H L M K W N P A Q L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T G P A A E L G V G Y P G W H I E C S A M A R E
- - - - - - - - - - - - G W H I E C S A M A R -
------------------------------------CGAGCACTCGATGTGCCAGCCGGGATAGCCGAC---
265266267268269270271272273274275276277278279280281282283284285286287288
A L G R D R I D I H T G G E D N I F P H H E C E
- - - - - - - - I H T G G E D N I F P H . E C E
------------------------CCCCAGCTGCGCCGGATTCCACTTCATCAGGTGCGT---GTCGGGCTT
289290291292293294295296297298299300301302303304305306307308309310311312
I A Q S R C G N G R N G T E S F A N L W L H S R
I A Q S R C G - - - - - - - - - A . L W L H S -
CCACAGGAGGAAGTCGGCCGG---------------------------GGT---GCGGCCGCCGGCCCC---
313314315316317318319320321322323324325326327328329330331332333334335336
H L M V D G A K M S K S K G N F L T V R G V L E
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------GCCCGAGAGCGCTCC------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G G F T G R P V D P A A L R L E L I R S S Y R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q T D F T A K G L R D S A S A V A K L R H F A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T L P M A D A A P A E D V R E H P A A H R F L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L A D D L N T A G A L A A A F A F A A G E P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A D A Q S A G V L A L M D G V L G V L E A A A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A R D L A W A S G L A R S I D A A R A A K D Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A A D A A R A E L L G A G F T V K T T A E G T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510
A E A P L A
- - - - - -
------------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_cys_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I T L Y N T L T R Q K E V F K P I E P G K V K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M Y V C G P T V Y N Y I H I G N A R P A I N Y D
M Y V . G P T V Y N Y I H I G N A R P A I N Y D
ATGTATGTA---GGTCCTACGGTATATAACTACATTCATATTGGTAATGCAAGACCAGCAATTAATTATGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V R R Y F E Y Q G Y N V E Y V S N F T D V D D
V V R R Y - - - - - - - - E Y V S N F T D V D -
GTAGTGAGACGTTAC------------------------GAATATGTATCAAATTTTACAGATGTAGAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K L I K R S Q E L N Q T V P E I A E K Y I A A F
- - - - - - - - - - - - - - - - - E K Y I A A F
---------------------------------------------------GAAAAATATATCGCTGCTTTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H E D V G A L N V R K A T S N P R V M D H M D D
H E D V G A L . . . . . T S N P R V M D - - - -
CATGAAGATGTTGGTGCTTTA---------------ACTTCAAATCCAAGGGTAATGGAC------------
121122123124125126127128129130131132133134135136137138139140141142143144
I I Q F I K D L V D Q G Y A Y E S G G D V Y F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T R K F E G Y G K L S H Q S I D D L K V G A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D A G E H K E D A L D F T L W K K A K P G E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W D S P F G E G R P G W H I E C S V M A F H E L
- - - - - - - - - - G W H I E C S V M A F - - -
------------------------------GGATGGCATATTGAATGTTCTGTAATGGCATTT---------
217218219220221222223224225226227228229230231232233234235236237238239240
G A T I D I H A G G S D L Q F P H H E N E I A Q
- - - - - I H A G G S D L Q F P H . E N E I A Q
---------------ATACATGCGGGTGGTTCAGATTTACAATTTCCACAT---GAAAATGAAATAGCACAA
241242243244245246247248249250251252253254255256257258259260261262263264
S E A H N H A P F A N Y W M H N G F I N I D N E
S E A H - - - - - A . Y W M H N - - - - - - - -
TCGGAAGCACAT---------------GCT---TATTGGATGCATAAT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K M S K S L G N F I L V H D I I K E V D P D V L
K M S K S - - - - - - - - - - - - - - - - - - -
AAAATGAGTAAATCA---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F F V I S V H Y R S P I N Y N L E L V E S A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S G L E R I R N S Y Q L I E E R A Q I A T N I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N Q Q T Y I D Q I D A I L N R F E T V M N D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N T A N A I T A W Y D L A K L A N K Y V L E N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T S T E V I D K F K A V Y Q I F S D V L G V P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K S K K A D E L L D E D V E K L I E E R N E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K N K D F A R A D E I R D M L K S Q N I I L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466
T P Q G V R F K R G
- - - - - - - - - -
------------------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_cys_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A L R V Y S T L D R E K K D F E K V T G K K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q S A D Y L G D T V T M Y V C G P T V Y K P S H
- - - - - - - - - - T M Y V . G P T V Y K P S H
------------------------------ACGATGTACGTC---GGGCCGACGGTCTACAAGCCGAGTCAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I G H M V G P V I F D T V K R Y L T Y L G Y K V
I G H M V G P V I F D T V K R Y - - - - - - - -
ATCGGGCACATGGTTGGCCCGGTCATCTTCGACACGGTGAAGCGCTAC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K W I V N I T D V D D K L I N R A K E L N T T V
K W I V N I T D V D - - - - - - - - - - - - - -
AAATGGATCGTCAACATCACGGACGTCGAC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P E L S A K M T E D Y F A C L K S L N V T G I D
- - - - A K M T E D Y F A C L K S L . . . . . D
------------GCGAAGATGACGGAAGACTACTTTGCGTGCCTCAAATCGCTG---------------GAT
121122123124125126127128129130131132133134135136137138139140141142143144
H F P K A T D H I G G M I E V I Q A L I K K D Y
H F P K A T D - - - - - - - - - - - - - - - - -
CACTTCCCGAAAGCGACCGAC---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A Y E V D D G V Y F D V A K D A D Y G K L S N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D P E Q M E A G A R L E P N P K K R N P G D F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L W K S K P G E P K E V Q F E S P F K C G R G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P G W H I E C T C M A I K E L G E T L D I H G G
- G W H I E C T C M A I - - - - - - - - I H G G
---GGGTGGCACATCGAATGCACCTGCATGGCGATC------------------------ATTCACGGCGGC
241242243244245246247248249250251252253254255256257258259260261262263264
G L D L Q F P H H E N E L A Q S E S W T D K P F
G L D L Q F P H . E N E L A Q S E S W - - - - -
GGGCTGGATCTCCAGTTCCCGCAC---GAAAACGAACTGGCCCAGAGCGAAAGCTGG---------------
265266267268269270271272273274275276277278279280281282283284285286287288
A H I W M H N G L L K M G S A K M A G S V G N V
A . I W M H N - - - - - - - - K M A G S - - - -
GCG---ATTTGGATGCACAAC------------------------AAGATGGCCGGCTCC------------
289290291292293294295296297298299300301302303304305306307308309310311312
V N I A D L L K K H T A E T V R F L L L S T H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R S P I E Y S E E R L D E I A R S L Q G F Y R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F E R Y E R Y T G V N F Y S I K A P E T Q E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S K L Y N R R T E G E N W F E S F C G A L D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F N T G N A I G F L Y Q L L N E L N R H A D R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G Y E E H P E K R K G Q Q F V D F T E G G I A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R T M G T I L G L F W E P P A K Q S L G G N D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L V S G L M Q L L L D L R N N L R A T A K E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K D N P L K K P L F D Q T D L I R K R L G E L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519
V T L E D R P G G T T W R V G
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_cys_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K Y I Y V C G P T V Y N K V H I G N M K P I M
- - Y I Y V . G P T V Y N K V H I G N M K P I M
------CAACTTTTTTTC---TAATTCTAGAAATAATTTATCTGAAATTTTGAAATTTTTATTTGTTTTTTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T F D L F L R G A N F I E K Q Y L F L H N L T D
T F D L F L R G - - - - - - - - L F L H N L T D
TATTTTTCATTTCAAAAACAAATC------------------------TGAGCTAAATTTAAACCCTAATAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I D D K I I E K A S K E N K T E L E I S E L Y S
I D - - - - - - - - - - - - - - - - - - E L Y S
TTTAAA------------------------------------------------------AATTTGCAAATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F Y L K M L D E Y N I N K P D Y I E K V T D N
D F Y L K M L D E Y . . . . . D Y I E K V T D -
AATTTCAAAATTTATTTTGCTAAATTCAAA---------------AGCAATTTTTTCAAGATATTTTTG---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I N M I I E Y I G L L V K K G S G Y I K K G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y F D T T K Y P E Y G S I S N L N L N K T L D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D D D F K N E K N N P H D F V L W K K T K V G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T W K S P W S E G R P G W H T E C S A L I N H I
- - - - - - - - - - - G W H T E C S A L I N - -
---------------------------------TCCAACATGCAATCATTTTTTTGCCAAAGAAAG------
193194195196197198199200201202203204205206207208209210211212213214215216
F K K D Q I D I H G G G I D L I F P H N E N E N
- - - - - - - I H G G G I D L I F P . N E N E N
---------------------TTCATTTTCATTATGGGGAAAAATCAAATCTAT---CCCTCCGTGAATATC
217218219220221222223224225226227228229230231232233234235236237238239240
I Q N I A L H G L S L A K K W L H V G H I K W E
I Q N I A L - - - - - A K . W L H V - - - - - -
AATTTGATCTTTTTTGAA---------------AGCTGA---TTCTGTGTGTCA------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N E K M S K S L N N F I L A D D F I E K Y G N D
- - K M S K S - - - - - - - - - - - - - - - - -
------ACTTTTTCAAGTTAT---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T F R T L I L N T S F S T P I S I N E E I L E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N K K I S N K Y Q V T F N Q A N L L I M Q S K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R Q N E V E T Q K Y L E K I A K L L E N F E F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K I N F E I N L Q I K L F N S V V D L D A A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L V E C F K L L G F K F S S Q N V S Q K D L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F L K W K I E K T N K N F K I S D K L F L E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413
E K K L V
- - - - -
---------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_cys_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I L K L Y N T R T K D F S E L T N F E N V K V
- - - - - - - - - - - - - - - - - - - - - - K V
------------------------------------------------------------------AAAGTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y A C G P T V Y N Y A H I G N F R T Y I F G D L
Y A . G P T V Y N Y A H I G N F R T Y I F G D L
TATGCT---GGGCCTACTGTTTATAATTATGCTCACATCGGGAATTTTAGAACTTATATTTTTGGAGATTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L I K T L R F L G Y K V N Y A M N I T D I G H L
L I K T - - - - - - - - N Y A M N I T D I G - -
TTAATTAAAACT------------------------AATTATGCGATGAATATTACAGATATTGGA------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G D L D D G E D K V A K T A R E K G L T V Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I S E F F T E A F F N D C R K L N I V Y P D K V
- - E F F T E A F F N D C R K L . . . . . D K V
------GAATTTTTCACAGAGGCTTTTTTTAACGATTGTAGAAAATTA---------------GACAAAGTT
121122123124125126127128129130131132133134135136137138139140141142143144
L V A S K H I P I M I E V V K I L E E K K I T Y
L V A S K - - - - - - - - - - - - - - - - - - -
CTTGTTGCAAGTAAA---------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F S N G N V Y F D T S C F K S Y G E M A G I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I D K D M T L P R V D V D K F K R N K T D F V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W F T N S K F K D Q E M K W D S P W G F G Y P S
- - - - - - - - - - - - - - - - - - - - - - - S
---------------------------------------------------------------------AGT
217218219220221222223224225226227228229230231232233234235236237238239240
W H L E C A A M N L E Y F K D A L D I H L G G V
W H L E C A A M N L - - - - - - - - I H L G G V
TGGCATTTGGAGTGCGCTGCGATGAATTTG------------------------ATTCATTTGGGAGGAGTT
241242243244245246247248249250251252253254255256257258259260261262263264
D H I G V H H I N E I A I A E C F L N K K W C D
D H I G V H . I N E I A I A E C F - - - - - C .
GATCATATTGGAGTTCAC---ATAAATGAAATAGCAATAGCAGAGTGTTTT---------------TGT---
265266267268269270271272273274275276277278279280281282283284285286287288
V F V H G E F L I M D Y N K M S K S R G N F I T
V F V H G - - - - - - - - K M S K S - - - - - -
GTCTTTGTTCATGGA------------------------AAGATGTCAAAGTCA------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V K D L E D Q N F S P L D F R Y L C L T S H Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N Q L K F S L D N L Q A S K I A R E N L I N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S Y F Y E S L D P V D L N T L N K D L K N F G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S V E K E Y Y D S F V E K I S F D L N V A Q G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A L L W E I I K S D N L S F V S K L R L A F I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D E I M S L N L R E E I L K N L Q N H D V V I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E N M K A L I E E R R I A K C E K N F K R A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I R D F F A K K G F V L V D T K E G T K V K R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_cys_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H N S L Q V Y N S L T R Q Q E T F T P T N P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y V G M Y V C G P T V Y G P A H L G H A R C Y V
- - G M Y V . G P T V Y G P A H L G H A R C Y V
------GGTATGTATGTT---GGGCCTACTGTATATGGTCCAGCGCACTTAGGACATGCACGTTGTTATGTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T F D V I Q R Y L T H L G Y Q V R Y V R N I T D
T F D V I Q R Y - - - - - - - - R Y V R N I T D
ACGTTTGATGTAATACAGCGTTAT------------------------AGGTATGTAAGAAACATTACGGAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V G H L E R D A D E G A D K I A K Q A S L E N V
V G - - - - - - - - - - - - - - - - - - - - - -
GTAGGC------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E P M E V V Q R Y M N S F H R D M A L L N V Q P
- - - - - - Q R Y M N S F H R D M A L L N - - -
------------------CAACGCTATATGAATAGCTTTCATAGGGATATGGCTTTGCTTAAT---------
121122123124125126127128129130131132133134135136137138139140141142143144
P N I E P Q A S G H I P E Q I R M I Q E I M N Q
- - I E P Q A S G - - - - - - - - - - - - - - -
------ATTGAACCACAGGCTAGTGGC---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G L A Y E V N G S V Y F N I M A Y R E K Y H Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K L S G R N I D D L L A G T R V L A G Q Q E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F P L D F A L W K K A N N T H I M R W P S P W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E G F P G W H I E C T A L A T K Y L G S C F D I
- - - - G W H I E C T A L A T - - - - - - - - I
------------GGTTGGCATATAGAATGTACAGCCCTTGCTACC------------------------ATT
241242243244245246247248249250251252253254255256257258259260261262263264
H G G G M D L L F P H H E C E L A Q S Q A A Q H
H G G G M D L L F P H . E C E L A Q S Q A A - -
CATGGAGGTGGTATGGACCTGTTGTTTCCGCAC---GAGTGTGAATTAGCACAATCGCAAGCAGCC------
265266267268269270271272273274275276277278279280281282283284285286287288
T T L A K Y W L H N N L V T I N D Q K M S K S L
- - - A . Y W L H N - - - - - - - - K M S K S -
---------GCT---TATTGGTTGCATAAT------------------------AAGATGAGTAAATCC---
289290291292293294295296297298299300301302303304305306307308309310311312
G N S I T L D E L F Q G I H P L L D R A Y S P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L R F F I L Q A H Y R S T L S F T N E A L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A E K G Y L K L I N G L K T T K D M K Y A P I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L G N V D E A M V A Q V E K H M A A C Y Q A M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N D F N T A K L I A E L F H L L K F I H A L A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R Q V D F Y K L G E K V F E T L K K T Y I Y I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D I L G L R E D Y K A V P A D L L S V I L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Y S Q A K Q Q K N Y E Q I E M L R A E L R V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495
I I V Q D T T R G V E W S H A
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_cys_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A F P T S V W L T N S L T G R L E E L R T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A P S T V L A Y I C G P T V Y D S T H L G H A R
- - - - - L A Y I . G P T V Y D S T H L G H A R
---------------ATTACCGTCAGG---CGTCTCGGCCAAGTGAGTGGGAATCCCACGCTCATCAAAAGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T Y V T F D V V R R I L E D Y F G L R V R Y Q C
T Y V T F D V V R R I - - - - - - - - - R Y Q C
TGAGAACTCCACGTTCTCTAGAAACATCTTCTC---------------------------TAAACGCTGCTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N I T D V D D K I I A R A V E R G S S I F D I C
N I T D V D - - - - - - - - - - - - - - - - - -
CTCAAGCTTTTCCTGCTG------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R K Y E Q E F L S D M H T L S V R P F T V V T R
R K Y E Q E F L S D M H T L . . . . . T V V T R
TTGGACCTTCCACTCCTCAACGTTTATCGGCTTAATATAAGA---------------TTCGATAGCAAATCC
121122123124125126127128129130131132133134135136137138139140141142143144
V T E Y M A D I I L F I Q K I M D N G F A Y V S
V T E - - - - - - - - - - - - - - - - - - - - -
TGTCAATGG---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A G S V Y F D V A A A R S A G Y S Y P K L R P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G S S S D E L Q L L I Q N A D G M D S K N R V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E K R S A S D F A L W K A W K E T E P E D A K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D A T F S H K N G A V S E L I T L P G R P G W H
- - - - - - - - - - - - - - - - - - - - - G W H
---------------------------------------------------------------ATCGTTGCG
241242243244245246247248249250251252253254255256257258259260261262263264
I E C S A M A A A V L G K D T G G A F D L H L G
I E C S A M A A - - - - - - - - - - - - L H L G
GAAGGCCGTATCCACGTTGGAGAG------------------------------------TGTACTGTATCT
265266267268269270271272273274275276277278279280281282283284285286287288
G C D L Q F P H H D N E L I Q L E T W A G K K N
G C D L Q F P H . D N E L I Q L E T W - - - - -
AAGGTTCTTGATTGGCTCAGAAAG---TTCCTCGTGCTGAATGATCTGGCGACAATT---------------
289290291292293294295296297298299300301302303304305306307308309310311312
M I G C F L H S G H L K I A G D V M S K S K K N
- I . C F L H S - - - - - - - - V M S K S - - -
---TTT---GTCCTTGGCAACTGC------------------------ATCCAGCGACGCGCT---------
313314315316317318319320321322323324325326327328329330331332333334335336
F K T V R E I L S I F T A N Q V R M L F C M V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y S A S L D Y S I S M M D A A V A K D K K I T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F L S N C R Q I I Q H E E E L S E P I K N L R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S T T E E A L E A Q T I E F L S N V D T A F R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D I N I V S A M S H V M L L I D N C K A Y I F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C Q T E G R Q V S T F L L S N A R D K I V H V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S I M G F S Y A R G E T S T A E N A L Q V A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V C N F R R E I K D L L M A S T T N T A E T D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K T L K K M L L G L C D R L R D E H L P L T G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A I E D A D K E S Y I K P I N V E E W K V Q R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R E L D L A E A K R L Q Q E K V Q Q E K L E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R L E R E K A L I P A E K M F L E N V E F S A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D E R G I P T H L A E T G P D G N P L P I P K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645
R Y K K L V K E W E A Q K K L N E K Y P S
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_cys_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S A N R V P T V V A G L D G A N P V K R E R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A W Y P P L K L D G N G L K V M N S L T E T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E D F A P R D G R V V R W Y T C G P T V Y D L S
- - - - - - - - - - - R W Y T . G P T V Y D L S
---------------------------------CGATGGTACACG---GGCCCGACCGTCTACGATCTCTCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H M G H A R A Y L T F D I I R R V M E D Y F G Y
H M G H A R A Y L T F D I I R R V - - - - - - -
CACATGGGCCACGCCCGTGCTTACCTCACCTTCGACATCATCCGCCGTGTC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S V I Y Q M N I T D I D D K I I K R A R V N K L
- - I Y Q M N I T D I D - - - - - - - - - - - -
------ATTTATCAGATGAACATCACGGATATCGAC------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D D F K E G E L R H G D V A R L M A F T A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V T A A E S G L A K R K A A L F E P I T E G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S R A K A D R E E K L L E V Q L K E S Q L V E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K V K I A A A K D D F A A L F A A A S G V N G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L L D E R S G H S V S D Q Q I F E D H A R K Y E
- - - - - - - - - - - - - - - - - - - - R K Y E
------------------------------------------------------------CGAAAATACGAG
241242243244245246247248249250251252253254255256257258259260261262263264
R A F F E D M Q R L G I R E P D I V T R V T E Y
R A F F E D M Q R L . . . . . D I V T R V T E -
CGAGCGTTCTTCGAGGACATGCAGCGCTTG---------------GACATCGTGACGCGCGTCACGGAG---
265266267268269270271272273274275276277278279280281282283284285286287288
V P Q V V E F V Q K I I D N G F A Y V G E T S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F F D T E A Y I R A G H D Y P K L K P G G D R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T T E D E M A E G E G V L S K G I E G E K R S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N D F A L W K F S K P G E P R W P S P W G E G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P G W H I E C S V M A S D I L G E N M D I H S G
- G W H I E C S V M A S - - - - - - - - I H S G
---GGCTGGCACATCGAGTGCTCCGTGATGGCGTCC------------------------ATCCACAGCGGT
385386387388389390391392393394395396397398399400401402403404405406407408
G W D L K F P H H D N E C A Q S E A C N L H S Q
G W D L K F P H . D N E C A Q S E A C - - - - -
GGGTGGGACTTGAAGTTTCCGCAC---GACAACGAGTGCGCGCAGAGCGAGGCGTGC---------------
409410411412413414415416417418419420421422423424425426427428429430431432
W V N Y F L H C G H L H I K G L K M S K S L K N
- V . Y F L H C - - - - - - - - K M S K S - - -
---GTG---TACTTCCTCCACTGC------------------------AAGATGAGCAAGAGC---------
433434435436437438439440441442443444445446447448449450451452453454455456
F I T I R Q A L D E L G V T A R T M R L L F L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N P W N K P M N F S D Q S L D E A K E K E R V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R A F F G S V D I V L R T D N W K A T Q G A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H D R E L L S K W V E A E A A V H A A L Q D N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D T V V A L Q Q L M S L V A A T N Q Y L L S G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R P S A T L V R K V G C Y V T K M F R I F G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E G S D D V G L Q K Q G S G D G E A R F I E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N T L V R F R D E V R D A A K D H K V V A G F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P L C D K V R D E W L V D A G V R L E D N P A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
P T T W K S D E P A L L H K E L A E R R A Q Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G D R Q R R L A N Q A E T K R K L V E K W R Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T Y P P S E Y F R L Q D E Q R V E K K Y A A Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D V T G L P T M T A A G E E V S E K E A K K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K E Q A K Y A K S Y D E F I G K G G V S W L Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784
Q E A E L A S M V A E L K G S N
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_cys_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L K F T N T L T R Q L E S F T P I K D R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S I Y C C G V T V Y D L C H L G H A R S Y I A W
S I Y C . G V T V Y D L C H L G H A R S Y I A W
TCTATTTACTGT---GGAGTTACTGTATATGATTTGTGTCACTTAGGTCATGCCCGTAGCTATATTGCCTGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V L R R Y L I W R G Y E V T F V Q N F T D I D
D V L R R Y - - - - - - - - T F V Q N F T D I D
GATGTCTTAAGACGTTAT------------------------ACTTTCGTACAAAATTTTACTGATATTGAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I L V R A A R E E S S M Q L V S D R N I E A
- - - - - - - - - - - - - - - - - - D R N I E A
------------------------------------------------------GACCGTAATATAGAGGCT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F K S D M A L L N I L P A D R M P R A T K C L D
F K S D M A L L . . . . . D R M P R A T K - - -
TTCAAGTCTGATATGGCCCTGTTA---------------GATAGAATGCCTCGAGCTACTAAA---------
121122123124125126127128129130131132133134135136137138139140141142143144
G I R S I I S D L E K K G V A Y S T E G D V Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S I K E Y A Q Y G K L S G K D L S K L Q E G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G R I S A S E E V R K K N S F D F A L W K K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I D E P S F T S P W G L G R P G W H I E C S T M
- - - - - - - - - - - - - - - G W H I E C S T M
---------------------------------------------GGATGGCATATAGAATGTTCAACGATG
217218219220221222223224225226227228229230231232233234235236237238239240
V R E E L G E T I D I H L G G A D L I F P H H E
V R - - - - - - - - I H L G G A D L I F P H . E
GTGCGA------------------------ATTCATCTAGGCGGTGCTGATCTTATATTTCCACAT---GAG
241242243244245246247248249250251252253254255256257258259260261262263264
N E I A Q S E M A N G K N L A N Y W L H N G M V
N E I A Q S E M A - - - - - A . Y W L H N - - -
AATGAAATTGCACAATCAGAAATGGCT---------------GCC---TATTGGCTTCACAAT---------
265266267268269270271272273274275276277278279280281282283284285286287288
N V N G Q K M S K S L G N F T T I R E L L A S G
- - - - - K M S K S - - - - - - - - - - - - - -
---------------AAGATGTCTAAGTCT------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I S P L A L R L F V L Q T H Y R K P L D F N S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A L K A A S I G W A N L N I A L S L G E R F K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N L Q W D L G E F T K L Y V L L M N K E D E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q K K L K P K L I E I M D P L K L A Y Q N F I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A M D E D L N T S A A I A I L F K L A K P L R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L S N R L E R G E I I N S N S K T V L F E E L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C Q W Q L L I G L A S I L G L R A E R L G E K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T S L S S N D I T V Q I K L R N E S K A K K D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L T A D R I R D F L K D K G I E L I D K P G N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510
T E W I Q H
- - - - - -
------------------
Class I
Eukaryotes/Crassostrea gigas/amino acid sequences/Cgigas_cys_aa
Eukaryotes/Crassostrea gigas/nucleotide sequences/Cgigas_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K L Y L Y N S L T K S R E P F A P I S N D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V K I Y S C G P T V Y D F P H I G N Y R S F L F
- K I Y S . G P T V Y D F P H I G N Y R S F L F
---AAAATTTACTCC---GGTCCAACGGTTTACGATTTTCCCCACATAGGTAATTACCGCTCCTTCCTTTTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D L L H R T L K A F G Y R V K L V M N I T D I
S D L L H R T - - - - - - - - K L V M N I T D I
TCCGACCTCCTGCACCGCACA------------------------AAATTGGTGATGAACATCACCGACATC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D D K T I K A S L A H K E S L K S Y T D R Y T Q
D - - - - - - - - - - - - - - - - - - D R Y T Q
GAC------------------------------------------------------GATCGCTACACTCAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A F L Q D L K D L Q I L Q A S H Y P R A T D N I
A F L Q D L K D L . . . . . S H Y P R A T D - -
GCCTTTTTGCAAGATTTAAAAGATTTG---------------TCCCACTACCCCCGCGCCACCGAT------
121122123124125126127128129130131132133134135136137138139140141142143144
K E M I E M I K V L L E K K H A Y I A D G S V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F R L S T F P N Y G K L N H F K L E D Q I V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G G R N D S D E Y K K E N F S D F V L W K K Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S D G D V F Y D S P F G K G R P G W H I E C S
- - - - - - - - - - - - - - - - - G W H I E C S
---------------------------------------------------GGTTGGCACATAGAATGTTCT
217218219220221222223224225226227228229230231232233234235236237238239240
A M S R R F L G D H F D I H T G G T D N R F P H
A M S R - - - - - - - - I H T G G T D N R F P H
GCTATGAGCCGC------------------------ATACACACAGGGGGCACTGACAACCGTTTTCCGCAC
241242243244245246247248249250251252253254255256257258259260261262263264
H E N E I A Q S E C F S G K D F V N Y W L H V A
. E N E I A Q S E C F - - - - - V . Y W L H V -
---GAAAATGAAATCGCCCAGTCAGAATGTTTT---------------GTC---TACTGGTTGCATGTA---
265266267268269270271272273274275276277278279280281282283284285286287288
H L L V E G E K M S K S L G N F Y T L R D L T K
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------AAGATGAGCAAGTCG------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R N I N P L T L R Y M M L S T H Y R N P F N F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L E G V S A V E K A I A R V N R T V Q R L E E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q K E L A I E A A S D K K S P T E K K I H A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D K V V E K M E R E I D R F Y Q A L A D D L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S S A L S V L F D V L A L V N P L L D K N Q M T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D K I A K S L T V F L H K V D E I F C F I D F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S T E S K I P K D I S D L A E K R D E A R K N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D Y A L S D Q L R D E I I A K G Y K V E D A A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489
K T V V K K H D A
- - - - - - - - -
---------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_cys_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_cys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K I Y N S L T K K L E I F N P I D P N N V K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------TCT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y I C G P T V Y D H S H I G H A R T Y V S F D
I Y I . G P T V Y D H S H I G H A R T Y V S F D
AACTTCATC---AATATTATACAAGTCCTTCTTATTCACACCTTCTTTTAGTGCCATCCTAATTTTATTCCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V I R N I L E K Y F N Y N V T F V M N I T D I D
V I R N I - - - - - - - - - T F V M N I T D I D
AAAAATATTAATTAA---------------------------TCTTACTTTTTCTTCTTTATTAATCCCAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K I I N K S K E T G M S M K D I T V K Y T N L
- - - - - - - - - - - - - - - - - - V K Y T N L
------------------------------------------------------TACTAAGTCTAATTTACT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F L E D M A L L N V R K P T V L T K V T E Y V D
F L E D M A L L . . . . . T V L T K V T E - - -
GTTAGTAAATGACACAAGTTCTAG---------------TGAAGGGGTATCAAAATTATTACT---------
121122123124125126127128129130131132133134135136137138139140141142143144
K I K E Y V K I L E N N G Y A Y E S N G S V Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D V M E Y K K K F K Y P I F R E E T V N N L G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S P N I Q D K K S P L D F A L W K K D N L F G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G R P G W H I E C S V M A N D V L G D Y I D I H
- - - G W H I E C S V M A N - - - - - - - - I H
---------TATACTTTTTATAGTAGTAAAATTTTTAAGAGA------------------------ATTTAA
217218219220221222223224225226227228229230231232233234235236237238239240
A G G V D L K F P H H E N E I A Q C Q A R Y Q K
A G G V D L K F P H . E N E I A Q C Q A R - - -
ATGTCCTGTGTGCATAAAATAATTAACCCA---TTTTTTCTGGTAGCGTGCTTGACATTGTGC---------
241242243244245246247248249250251252253254255256257258259260261262263264
K P W V N Y F M H T G H L N I N G L K M S K S L
- - - V . Y F M H T - - - - - - - - K M S K S -
---------CGG---TTTAAGATCAACCCC------------------------TCCCAATACATCATT---
265266267268269270271272273274275276277278279280281282283284285286287288
K N F T T I K S I L E R C T P I Q L R I L F L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H Q W N K D M N Y E E E Q I K F A Q N V E K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F N F F M Y V N S I N N I S K I Y N K N D I E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L D L I S K T S K I V D V S F S N N F D T P S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I K A L L E L V S F T N S K L D L V S A C T L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q V R D F V K R I L D I L G I N K E E K V R D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D S E N L A K L I N I F R N K I R M A L K E G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N K K D L Y N I C D E V R D N L K D L G Y V L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467
D S K L E T L I K K L
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_gln_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T A P H D A E G P S H D P L G F L R E A V Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L D T G R C E L P V R T R F P P E P N G F L H
- - - - - - - - - - - R T R F P P E P N G F L H
---------------------------------AGGACCCGCTTTCCGCCGGAGCCCAACGGCTTCCTGCAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H A K A I C I D F G V A R A F G G P C L L R
V G H A K A I C I D F G V A R A - - - P C L L R
GTCGGCCACGCCAAAGCCATCTGCATCGATTTCGGCGTCGCCCGCGCC---------CCGTGCCTGCTCCGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F D D T N P V A E E A R Y A D A I R T D L A W L
F D D T N - - - - - A R Y A D A I R T D L A W L
TTCGACGACACCAAC---------------GCCCGCTACGCCGACGCGATCCGCACGGACCTCGCGTGGCTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G F E P S E I T H T S D H F D A L A G L A D R L
. . . . S E I T H T S D - - - - - - - - - - - -
------------TCGGAGATCACCCACACCAGCGAC------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E G G L A Y V D E Q P V E A I R E Q R G S L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R P G T P S P F R D R P A A E S A A R F A E M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S G A A P E G S M V L R A K I D M A A P N L N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R D P V L Y R V L H A T H A R T G D A W K V Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T Y D F A H G Q C D A I E G V T H S L C S L E F
T Y D F A H G Q C D A - - - - - H S L C S L E F
ACCTACGACTTCGCCCACGGCCAGTGCGACGCG---------------CACTCGCTGTGCTCGCTGGAGTTC
241242243244245246247248249250251252253254255256257258259260261262263264
E D H R P L Y D W F I E K L G L F P S R Q I E F
E D H R P L Y D W F I E K L - - - - S R Q I E F
GAGGACCACCGCCCGCTCTACGACTGGTTCATCGAGAAGCTG------------TCCCGGCAGATCGAGTTC
265266267268269270271272273274275276277278279280281282283284285286287288
G R L N L T H T I T S K R K L R A L V D E G I V
- - - - - - - - I T S K R - - - - - - - - - - -
------------------------ATCACCAGCAAGCGG---------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G G W D D P R M P T L A G M R R R G Y A A A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R S F C D E L G V T K F V G T T E L A L L E H H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q R K H L N E T A E R R M A V M D P I E L V V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D F E E G R V D R L P A V N R P Q D G E E G A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R E L P F T R T L Y I E R E D F K E D A N R K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F R L T P G R E V R L R W A Y L V T C T G C E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D S D G N V V R V F A T H D P A S R G G N A P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G R K V K G T I H W V S A G H A I D A E C R L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R P L F A T A D P A E G A D E D P P R G W R E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L A P D S L E V V T A K A E P S L A D A G P G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P V Q F E R I G Y F H R E P G E R P V F H R V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562
P L R E D A G K R A
- - - - - - - - - -
------------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_gln_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S V R V R I A P S P T G N L H I G T A R T A V
- - - R V R I A P S P T G N L H I G T A R T A V
---------CGCGTTCGCATTGCTCCTAGCCCCACCGGCAACCTCCACATTGGCACGGCCCGCACTGCCGTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F N W L F A R R H Q G Q F I L R I E D T D L E R
F N W L F A R R - - - Q F I L R I E D T D - - -
TTCAACTGGTTGTTTGCGCGGCGG---------CAGTTCATCCTGCGCATCGAAGATACAGAC---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S R S E Y T D N I L T G L Q W L G L N W D E G P
- - S E Y T D N I L T G L Q W L . . . . D - G P
------TCGGAATACACCGACAACATCCTGACCGGCCTCCAGTGGCTG------------GAC---GGCCCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F Y Q T Q R L D L Y K A A V Q Q L L D S G K A Y
F Y Q T Q - - - - - - - - - - - - - - - - - - -
TTCTACCAAACCCAG---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R C Y C T E A E L E A L R E S Q R A R N E A P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y D N R H R D L T P E Q E A A F Q A E G R E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I R F R I D D D R E I A W T D L V R D R V V W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G S D L G G D M V I A R R S P A G T I G Q P L Y
- - - - - - - - - - - - - - - - - - - - - - L Y
------------------------------------------------------------------CTCTAC
193194195196197198199200201202203204205206207208209210211212213214215216
N L A V V V D D I D M T I S H V I R G E D H I A
N L A V V V D D I - - - - - H V I R G E D H I A
AACCTCGCGGTCGTGGTCGATGACATC---------------CACGTCATTCGCGGCGAAGACCACATCGCT
217218219220221222223224225226227228229230231232233234235236237238239240
N T A K Q I L L Y E A L G A A V P E F A H T P L
N T A K Q I L L Y E A L - - - - P E F A H T - -
AACACCGCCAAGCAAATCCTGCTCTACGAAGCGCTG------------CCCGAGTTTGCGCACACG------
241242243244245246247248249250251252253254255256257258259260261262263264
I L N K E G R K L S K R D G V T S I S D F Q N L
- - - - - - - K L S K R - - - - - - - - - - - -
---------------------AAACTCTCGAAGCGT------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G Y L P E A I A N Y M T L L G W S P V E G M D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F S L A E A A T V F D F D R V N K A G A K F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
W D K L N W L N S Q V I K E K S A S E L V A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q P F W S K A G V D T A A Y P A A W L E E L A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L L G P S L V T L T D I V G Q S Q L F F S Q G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L Q E D A I A Q L G Q A G S K A V L Q Q I L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L P S E A L T L E V A K G L I D Q A V K A A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V K K G I G M R S L R A A L M G S M Q G P D L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T S W V L L H Q A G Q A Q P R L Q A A I A A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481
G
-
---
Class I
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_gln_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G L V P E C F I T E L V E R D L K E G K Y A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L V T R F P P E P N G Y L H I G H A R S I V L N
- V T R F P P E P N G Y L H I G H A R S I V L N
---CCGCCAGAAGTAGCCCAGGCGCTCCAGCTGGTAGCGGGTGTCCTCGGGGTCCTGGGCCACGCTCGGCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F G L A Q D Y G G E C N L R F D D T N P E T E K
F G L A Q D - - - E C N L R F D D T N - - - - -
AATGAAGCCCCGCTTCAC---------CTCGGGGTTGAGGTTTTGCAGGAAGTCCCC---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E E Y A R A I E E D V R W L G F R P T R V L Y A
E E Y A R A I E E D V R W L . . . . T R V L Y A
CTTGGTGCGGAAGAGCCTGCCGTAGAGCCTAAACTCCACGGG------------GGCGGAGACCCAGTGGAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S D Y F E T M Y Q C A L V L I Q E G K A Y V D D
S D - - - - - - - - - - - - - - - - - - - - - -
CACCCC------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L P E E E M S E L R A Q G K P S P Y R E R S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E N L E L F E R M R R G E F P T G S R V L R A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I D P A H P N F K L R D P V L Y R I V H A P H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H V G D R W V I Y P M Y D F A H P L E D F I E G
- - - - - - - - - - M Y D F A H P L E D F - - -
------------------------------GGGGTCCACCACGCCCAAGACCCTGGGGGCGAT---------
217218219220221222223224225226227228229230231232233234235236237238239240
V T H S L C T L E F E N N R T V Y D W V I E N L
- - H S L C T L E F E N N R T V Y D W V I E N L
------CCGCACCACCTCCTCAAAGAGGTCCATCTCTATCTGGGCCTCGTTCCTGGAGATCCCCGTCTTGCG
241242243244245246247248249250251252253254255256257258259260261262263264
K G K C G L P T S P R P H Q Y E F A R L D L S H
- - - - - - - - - - - P H Q Y E F - - - - - - -
---------------------------------CCTCCGCCTCAGGCCCCT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T V L S K R K L I K L V E G G Y V S G W D D P R
- V L S K R - - - - - - - - - - - - - - - - - -
---CCAGCCCGAGACGTA------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L P T L R G L R R R G V R P E A I V E F V R K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G I S R N E A Q I E M D L F E E V V R D D L N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I A P R V L G V V D P L K V V L T N Y E G E E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I E A P Y W P R D I P K E G T R P L P F S P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y I E R T D F S L N P P K G W K R L A P G Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R L R H A Y V I E L E D V V E E G G E V R L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R I V P G T L G A N P E D G V R P K G V I H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V S A R H A L P V E F R L Y G R L F R T K D P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E G G D F L Q N L N P E A L V V K R G F I E P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V A Q D P E D T R Y Q L E R L G Y F W R D P V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548
S R P E A L V M N R I V P L K E G Y R V
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_gln_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T D M T D I K N E E A G E K K S L N F I E Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V E N D L K A G K N G G K V Q T R F P P E P N G
- - - - - - - - - - - - - - Q T R F P P E P N G
------------------------------------------CAAACACGGTTCCCGCCGGAACCAAACGGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y L H I G H A K A I C L D F G I A A A H G G V C
Y L H I G H A K A I C L D F G I A A A - - - V C
TACCTGCACATCGGGCACGCTAAAGCCATTTGTCTCGACTTCGGCATCGCTGCCGCA---------GTGTGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N L R F D D T N P T K E D M E Y V E A I Q E D I
N L R F D D T N - - - - - M E Y V E A I Q E D I
AACCTTCGTTTCGACGACACTAAC---------------ATGGAATATGTAGAAGCCATCCAGGAAGATATC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R W L G F Q W G N V Y Y A S D Y F Q Q L W D F A
R W L G - - - - N V Y Y A S D - - - - - - - - -
CGGTGGCTGGGA------------AACGTATATTATGCCTCAGAT---------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V T L I K E G K A Y V D E Q T S E Q I A Q Q K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T P T Q P G V E S P Y R N R P I E E S L A L F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K M N S D E A K E G S M V L R A K I D M A S P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M H F R D P I M Y R I L H V A H H R T G T Q W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A Y P M Y D F A H G Q S D Y F E G V T H S L C T
- - - M Y D F A H G Q S D Y - - - - - H S L C T
---------ATGTATGACTTTGCACACGGTCAGAGCGACTAT---------------CACTCACTCTGTACA
241242243244245246247248249250251252253254255256257258259260261262263264
L E F V P H R P L Y D L F I D W L K E G K D L D
L E F V P H R P L Y D L F I D W L - - - - - - -
CTCGAGTTCGTGCCTCACCGTCCTCTTTACGATCTGTTCATCGACTGGCTG---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D N R P R Q T E F N K L N L N Y T L M S K R N L
- - - P R Q T E F - - - - - - - - L M S K R - -
---------CCCCGTCAGACGGAGTTC------------------------CTGATGAGTAAACGC------
289290291292293294295296297298299300301302303304305306307308309310311312
L I L V K E G L V N D W D D P R M P T L C G F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R G Y S P E S I R K F I D K I G Y T T Y D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N D F A L L E S A V R E D L N A R A T R V S A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N P V K L I I T N Y P E G Q V E E L E A I N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P E D P T A G S H T I E F S R E L W M E R D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M E D A P K K Y F R M T P G Q E V R L K N A Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V K C T G C K K D E N G T V T E V Y C E Y D P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T R S G M P D A N R K V K G T L H W L S C N H C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L P A E V R L Y D R L W K V E N P R D E M A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R E A K G C D A L E A M K E M I N P D S L T V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P H C Y I E K Y V A D M P A L S Y L Q F Q R I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y F N I D K D S T P G H L V F N R T V G L K D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582
W G K I N K
- - - - - -
------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_gln_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T A L T G R L A P S P T G A Q H V G N A R T
- - - - - T G R L A P S P T G A Q H V G N A R T
---------------ACCGGCCGACTGGCCCCCTCGCCGACCGGCGCGCAGCACGTCGGGAACGCCCGCACG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y L V A W L A A R A G G G T V R V R I E D I D S
Y L V A W L A A R A - - - T V R V R I E D I D -
TACCTGGTCGCGTGGCTCGCGGCGCGGGCC---------ACCGTTCGGGTCCGCATCGAGGACATCGAC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P R I K P G A A E Q A L D D L R W L G L D W D G
- - - - P G A A E Q A L D D L R W L . . D - - -
------------CCCGGCGCGGCGGAGCAGGCGCTCGACGACCTCCGCTGGCTC------GAC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V V T Q T T R L P L Y E A A L E T L K Q A E Q
E - V T Q T T - - - - - - - - - - - - - - - - -
GAA---GTCACCCAGACGACG---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I Y P C T C T R S D I A S A A S A P H A G E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T Y P G T C A H R S A A D A V V L Q R D G K P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A W R F R V A D S P A F T D L F A G E Q Q I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K H A G G D F V V W K S A G T P A Y Q L A V V V
- - - - - - - - - - - - - - - - A Y Q L A V V V
------------------------------------------------GCTTATCAGCTCGCGGTCGTGGTG
193194195196197198199200201202203204205206207208209210211212213214215216
D D A A M G V T E V V R G D D L I P S T P R Q L
D D A - - - - - E V V R G D D L I P S T P R Q L
GACGACGCC---------------GAAGTGGTGCGCGGCGACGACCTCATCCCGTCCACGCCGCGGCAACTC
217218219220221222223224225226227228229230231232233234235236237238239240
L L Y R A L G L A P P A F A H V P L V V G A D G
L L Y R A L - - - - P A F A H V - - - - - - - -
CTGCTGTATCGCGCGCTG------------CCGGCGTTCGCGCACGTC------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R R L A K R H G D T R L A A L R S A G V K P E A
- R L A K R - - - - - - - - - - - - - - - - - -
---CGGCTCGCCAAGCGC------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L L G L L G W S C G W L D R P E P V R A R D L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A R F R L E T I P K R T F V L T A D L L S A I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315
Y A G
- - -
---------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_gln_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A G P A A A E V K E M E T K R D L S I L Q N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R P V P G C R N T R E L L E A H E K V T G G K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y F R F P P E P N G F L H I G H A K S M N L N F
Y F R F P P E P N G F L H I G H A K S M N L N F
CTCGAAGTGCTTGAAGTTCTCGACGCCCTTCTCCGCGTACCCGTGCGACACCACCTCGCTCTTCTCGTCGAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G S A R A H G G K C Y L R Y D D T N P E S E D Q
G S A R A - - - K C Y L R Y D D T N - - - - - Q
GAACTTGAGAAACTC---------GGCGGCACGGTCGTCCTTGAGAAGCGCGTT---------------CAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Y I D A I M E M V D W M G W K P D W V T F S S
V Y I D A I M E M V D W M . . . . D W V T F S S
CGGCGTACATGCCGTCGCGCTCACCCAGGAGATATTTGT------------TTTACGCTCGAAGTCGATGTC
121122123124125126127128129130131132133134135136137138139140141142143144
D Y F D Q L H T F A V Q L I K D G K A Y V D H S
D - - - - - - - - - - - - - - - - - - - - - - -
TAC---------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T P D E L K Q Q R E Q R E D S P W R N R S V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N L L L F K H M R Q G R Y A E G E A T L R V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D M K S D N P N M R D F I A Y R V K Y V E H P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I K D K W C I Y P S Y D F T H C L I D S L E D I
- - - - - - - - - S Y D F T H C L I D S - - - -
---------------------------CAGGGTGTTCTCCAGCATGCTGATCTGAATTAC------------
241242243244245246247248249250251252253254255256257258259260261262263264
D Y S L C T L E F E T R R E S Y F W L L N E L N
- Y S L C T L E F E T R R E S Y F W L L N E L -
---GATACCAACCAGCTCGCAGAAGCGGTTAATGGCGGCCGGAGTGTACCCGCGGCGACGCATGCCAGC---
265266267268269270271272273274275276277278279280281282283284285286287288
L W R P Y V W E F S R L N V T G S L L S K R K I
- - - P Y V W E F - - - - - - - - L L S K R - -
---------GCGGGGGTCGTCAAACCC------------------------CACGTTGATCTTGCG------
289290291292293294295296297298299300301302303304305306307308309310311312
N V L V R K G I V R G F D D P R L L T L A G M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R G Y T P A A I N R F C E L V G I T R S M N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I Q I S M L E N T L R E D L D E R C E R R L M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I D P I K V V V D N W K G E R I F E C P N H P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K P E L G S R A L T F T D T F Y V D R S D F H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D D D N S K F Y G L A P G P R V V G L K Y S G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V V C K S F E V D A K G Q P M V I H V D I D F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R K D K P K T N I S W V S A T A C T P V E V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y N A L L K D D R A A I D P E F L K F I D E K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E V V S H G Y A E K G V E N F K H F E S V Q A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R F G Y F V V D P D T T A D H L V M N R V L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570
R E D K S K A T V A E P V P A K R K
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_gln_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A S L G L K I E N E H I N V V S N T T N F I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q I V E D D L K N G K H N K I V T R F P P E P N
- - - - - - - - - - - - - - - V T R F P P E P N
---------------------------------------------GTTTTCCCTAGCTCCCGATTCAGTAAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G F L H L G H A K S I C L N Y G I A K I Y D G R
G F L H L G H A K S I C L N Y G I A K I - - - R
CATTTTGATTAATAGGTCTGGAGATTCTCCGAGCTGTACGGTTAGATTGTATACAAGATT---------ATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F H L R Y D D T N P Y S E E Q Q Y I D A I E E D
F H L R Y D D T N - - - - - Q Q Y I D A I E E D
CTCTCGTTTAGAATCAACAATATCTCT---------------TCTTTCGAATTGATATCTATTCATCTTTAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V R W L G V D W G E H K Y Y A S D Y F D Q L Y E
V R W L G - - - - E . K Y Y A S D - - - - - - -
TTCTCCTTTACTATT------------ATT---TAAGTTCTTTTCTGAAAA---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W A K K L I L A G K A Y V D H Q T V E E I R K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R G D S N T P A V E S I Y R N R S I N E N M E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F E R M K D G K C D E G E C V L R A K I D M K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G N P N L R D P I L Y R I L K Q S H P H T G D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
W V I Y P M Y D F A H G Q S D S I E G I T H S I
- - - - - M Y D F A H G Q S D S - - - - - H S I
---------------CTGCTGAGAATCAATTTCTTGATTTTCATCGAA---------------TTCAATCCA
241242243244245246247248249250251252253254255256257258259260261262263264
C T L E F E L H R P L Y D W L Q S E L E I T K T
C T L E F E L H R P L Y D W L Q S E L - - - - T
CAAATTTCTCGTCAAGTACAGGACTCTTTCGCCCATGTCAATATTATCATCAGGATG------------TAT
265266267268269270271272273274275276277278279280281282283284285286287288
R Q I E F A R L N M T Y L V L S K R K L L L L V
R Q I E F - - - - - - - - V L S K R - - - - - -
TTCAACTGCTTCTTT------------------------AATGACTACTTTTAG------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N E K H V A G W D D P R M P T L S A V R R K G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P P Q S L W D F C D K I G A S K R D Q M I H I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L L E D C V K E N L H S I C Q R R F A C I Q P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K V V I I N W D E C F Q K E A V E I T V K N H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D D N I D M G E R V L Y L T R N L W I E K S D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W F D E N Q E I D S Q Q P P G D F K R L F I G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S V R L K Y S Y A I T C K N A I I D T D T K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K E V H C I I H S S D N E N D S N V N K K K L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A I H W L S T S N V T N V E F R L Y G R L F T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P E P E N Q D K D W R Q F I N N K S L V V I H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F S E K N L L N D E F F N S K G E I K M N R Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F E R I G Y F T R D I V D S K R E N D K I N L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y N L T V Q L G E S P D L L I K M L T E S G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E N T K D I E R R N A Y H T N R E K I A A E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640
A R K L A K E A K K V Q K N N L
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_gln_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H E K K S A F S K T C E S L G I D P N A E Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S T I E C L N I L V K K V P Q D R L A H R S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L S K V M S G F S T K Q L N A A I A Y L A S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q S P T I N E V E F D K A C G I G V T Y T E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I S S A L D K A L A K P D S I K N P Y Q L V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
M G R D L P W A E H D F L L N L A T E K F A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E M R I T A H S C E E D A I T T K T S E A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S K D S P P T G S I H V P P I A Q V L S A I P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q N R Y E Q L L K Y K W Q H K D F L K N L G V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V L T R F P P E P N G Y L H L G H A K A M F I S
- L T R F P P E P N G Y L H L G H A K A M F I S
---CTCACGCGCTTTCCCCCTGAGCCGAATGGATACTTGCATCTGGGCCACGCAAAGGCCATGTTCATTTCC
241242243244245246247248249250251252253254255256257258259260261262263264
F N Y A L L N N G K T Y L R M D D T N P E A E S
F N Y A L L - - - K T Y L R M D D T N - - - - -
TTCAACTATGCTCTTCTT---------AAGACCTATCTTCGTATGGATGATACCAAT---------------
265266267268269270271272273274275276277278279280281282283284285286287288
K E Y I D S I L A S I E W L G H K P F K F T H T
K E Y I D S I L A S I E W L . . . . F K F T H T
AAGGAGTATATTGACTCTATCTTAGCTAGTATCGAGTGGCTG------------TTCAAATTCACACATACC
289290291292293294295296297298299300301302303304305306307308309310311312
S D Y F Q R L Y D V A V E L V R Q G K A Y V C D
S D - - - - - - - - - - - - - - - - - - - - - -
TCCGAC------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q T V E E V A K Y R E E R L D P P G R K R S I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E N L R I F E G M K C G L Y K E S Q Y T L R L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I D M Q S D N P N M R D P I A Y R I K Y C R H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L T G S A W C I Y P S Y D F S H C L I D A F E H
- - - - - - - - - - S Y D F S H C L I D A - - -
------------------------------TCCTATGATTTCTCTCATTGTCTTATCGACGCA---------
409410411412413414415416417418419420421422423424425426427428429430431432
I T H S L C T L E F G I R R E S Y D W V T H N V
- - H S L C T L E F G I R R E S Y D W V T H N V
------CATTCACTATGCACTCTGGAGTTCGGCATTCGTCGAGAATCGTACGACTGGGTCACGCACAATGTC
433434435436437438439440441442443444445446447448449450451452453454455456
H D F R T S D G F D V G Y R P M Q W E F S R L N
- - - - - - - - - - - - - - P M Q W E F - - - -
------------------------------------------CCTATGCAATGGGAATTC------------
457458459460461462463464465466467468469470471472473474475476477478479480
I T Y N V M S K R R L L T L V D K K I V M G W D
- - - - V M S K R - - - - - - - - - - - - - - -
------------GTCATGAGCAAGAGG---------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D P R L L T L D G L R R R G Y T P S S I N T F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q V V G I S R N A Q T I D Y H L L E H V L R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L D P I A E R T M A V T S P I R V E L L D F G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D P L D T V P I S Y S L H P K N S E M G T E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K L E R I L Y I D A E D F C E N N T P D F F R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A P G Q P V G L R Y G P L L L V D H F E R R T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K G G D T E L V L Y C T H S W C P E K K E E A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K R L K A E K K Q L T H I H W V S E T G S R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E V R L F D K L F K S A N P Y E V E G D W I D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V N P N S M V V C P R A R V P R Y V A E Q A K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N T S P K R Y Q F E R S G Y F I V D T S S T A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763
H L V F N R I V E L R G T F V P P T N
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_gln_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A S R E E Q E K E A E R I F L G I G L A E K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A E T A V S K K K F R G I L L E I I K E A G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N G C D K T R G T L L Y S S A S T Y P D N A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H R S H F L R E Y I S S G K L K S S E Q L E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F K V L S S Y G S E P V D W Q K L E E A A G V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V V V T P E E I A A A V A S V V K A N E N Q L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T E R Y H T P V G K L L A S V K A S L K W A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S K V K Q E L D G Q I L N L L G P K T E Q D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K P D K K K S K V Q S F L A V Q E K K P A K E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G A V S A K N A D T K A E D T E A W R H A D P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A H F K H P A D N N E V H T I V D F S D G S Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
C I A N N A E K L A E H L K I T G G K V V T R F
- - - - - - - - - - - - - - - - - - - - V T R F
------------------------------------------------------------GTGACGCGTTTC
289290291292293294295296297298299300301302303304305306307308309310311312
P P E P N G Y L H I G H A K A M F V D F G F A E
P P E P N G Y L H I G H A K A M F V D F G F A E
CCGCCTGAGCCAAATGGATACCTACACATTGGCCACGCCAAGGCTATGTTTGTTGACTTTGGCTTTGCGGAG
313314315316317318319320321322323324325326327328329330331332333334335336
R Y S G D C Y L R F D D T N P E A E K Q E Y I D
R - - - D C Y L R F D D T N - - - - - Q E Y I D
AGG---------GACTGCTATTTGCGCTTTGATGACACCAAC---------------CAAGAGTACATAGAC
337338339340341342343344345346347348349350351352353354355356357358359360
H I Q D I V A W L G Y K P W K V T Y S S D Y F T
H I Q D I V A W L . . . . W K V T Y S S D - - -
CACATCCAGGACATCGTTGCCTGGCTG------------TGGAAGGTGACATACAGCTCAGAC---------
361362363364365366367368369370371372373374375376377378379380381382383384
E L Y N F A I Q L I R S G N A Y V D H Q T A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I K A Y R E E R R P S P W R D R P V E E S L Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F E D M R R G L I D E G K A T L R M R M D P K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A N Y N M F D L I A Y R I K F T P H P H A G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W C I Y P S Y D Y T H C L V D A L E N I T H S L
- - - - - S Y D Y T H C L V D A - - - - - H S L
---------------TCCTACGACTACACCCACTGCCTGGTGGACGCT---------------CACTCCCTC
481482483484485486487488489490491492493494495496497498499500501502503504
C T L E F E S R R A S Y Y W L L H V L D T Y K P
C T L E F E S R R A S Y Y W L L H V L - - - - P
TGCACGCTCGAGTTCGAGTCTCGCCGCGCCTCCTACTACTGGCTACTGCACGTGCTG------------CCA
505506507508509510511512513514515516517518519520521522523524525526527528
V V W E Y G R L N I T H N V L S K R K L N R L V
V V W E Y - - - - - - - - V L S K R - - - - - -
GTGGTGTGGGAGTAC------------------------GTGCTGTCCAAGCGC------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T D G Y V D G W D D P R L L T L A G L R R R G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T P Q A I K E L C Q E I G I T R N D S E I H L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K L D H H I R T D L D A T S P R A L A V L D P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R L V L T N L P A D H L Q T F D A K V F P G R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E E T Y P V T L T R V V Y V A A E D F R E V D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K G Y F A L A P Q K E C M L K Y A G I V R C T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F E K S G G K V T E V H A E F R L L E K G E K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P K G V L S W V G Q P M A G Q E P T M F E A R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y D V L F K T S S V A D T G D E W L Q D L N P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S L T L K T G A I S T P R I T Q A A P G S R F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L E R L G Y F C V D P D T R I G K L V L N R T C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805
T M K E T N L A A L K G A
- - - - - - - - - - - - -
---------------------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_gln_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_gln_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F D V E S L L K K L N V S E D K K E N I L Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E Q L K K N L E T L Y T N F D T D N K L L F T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A C T A P K K I D I L I F G I L I N E N V I K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D A T L R A S M K F A I K N T D V T Y E E L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F I L K N T K S K E E V S E I I N K A C L S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S K K E V Y I I L K N K L P F E D S K Y L M D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V N K F E I D T S K S K K V K D W L E E G E V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
M L H K P G D N P Q L N E K I L K D H L E R T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G K V V T R F P P E P N G I L H I G H A K A I N
- - - V T R F P P E P N G I L H I G H A K A I N
---------GTTACTAGATTCCCCCCAGAGCCAAATGGTATTTTACATATTGGTCATGCAAAAGCTATAAAT
217218219220221222223224225226227228229230231232233234235236237238239240
L D F G Y A E K Y N G I C Y L R F D D T N P R N
L D F G Y A E K - - - I C Y L R F D D T N - - -
CTTGATTTTGGATACGCGGAAAAA---------ATTTGTTATCTTAGATTTGACGATACAAAT---------
241242243244245246247248249250251252253254255256257258259260261262263264
E E D Y Y F E S I I E D V K W L G F E P Y A I T
- - D Y Y F E S I I E D V K W L . . . . Y A I T
------GATTATTATTTCGAATCTATTATTGAAGACGTTAAATGGTTA------------TATGCAATTACA
265266267268269270271272273274275276277278279280281282283284285286287288
S S S K Y F G D M C E L A E K L I L K D K A Y I
S S S K - - - - - - - - - - - - - - - - - - - -
TCGTCAAGTAAA------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
C E L S N E E L K K R R R M L S E A F E T D K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K S I E E L G L I L S P Y R N R E I S E N L K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F R E M V E K K H K E G D Y T L R F K M D I R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K N P M M F D L V G M R I I D C D H V V T K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y N L Y P S Y E F A L C V S D S L E D V T H S F
- - - - - S Y E F A L C V S D S - - - - - H S F
---------------TCGTACGAATTCGCGCTTTGTGTTTCTGATTCT---------------CATTCTTTT
409410411412413414415416417418419420421422423424425426427428429430431432
C T R E F F T R Q E S Y K W L L D A L E I Y K P
C T R E F F T R Q E S Y K W L L D A L - - - - P
TGCACTCGAGAATTTTTTACTAGACAAGAAAGTTATAAATGGCTTTTGGATGCATTA------------CCA
433434435436437438439440441442443444445446447448449450451452453454455456
V Q W E F S R L N I S N T V L S K R K I V P L K
V Q W E F - - - - - - - - V L S K R - - - - - -
GTTCAATGGGAGTTT------------------------GTATTAAGTAAAAGA------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K Y G I E L D D P R L Y T I K G M R R R G I P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q A I N N F V K S L G I T Y A E T I I D N K K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E S F I R D E L N K T T Q R V M C V M D P L K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y I R N A K E Q E I S I P N S N Q K I I F K P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I Y I E K S D F K M E D D D K D F L R F T P N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S V G L Y M F G A I K F I K F D N D M I I A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T N E T P K K F I H W V S C D S I K V T I R L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D P L F R S F N P E E G N Y L D N I N L D S L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T V V G Y C D D R I K G C E V E D K F Q F Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695
G Y F C V D P D T T P E N I V F N R I I T L I
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_glu_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D D V R S V L L I A A L S N A V K H K S V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G A V M G A I L G T H P E L R S K A G E I K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L G S V L E E V S S L S A E D R E E K L K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A P D Q Y A S L F E K K E K K K I G L P D L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E G G V V M R F A P N P S G P L H L G H A R A
- - - - - V M R F A P N P S G P L H L G H A R A
---------------TGCACCAGATTCAAGTTCAGCCTTTGGCAGGTAGAGACTTCCGGCAAAGGGAATCTC
121122123124125126127128129130131132133134135136137138139140141142143144
A F L N D E Y I R R Y G G K Y I L R I E D T D P
A F L N D E Y I R R - - - K Y I L R I E D T D -
ACGGTATCCCCTCGATTCATCTCCCGGATA---------TTTTGCCACAACCGGGTCACTTCCGGATAC---
145146147148149150151152153154155156157158159160161162163164165166167168
K R V D P D A Y D M V R E D I A W M G L S I A E
- - - - P D A Y D M V R E D I A W M . . . . A -
------------ATCAGGAACAAAGAAGAACCGGTCAGCCTGACTGTCAATGAT------------TGC---
169170171172173174175176177178179180181182183184185186187188189190191192
T I F Q S D R F S K Y Y E V G K E L I Q K G H A
T I F Q S D - - - - - - - - - - - - - - - - - -
GAGGTTTTCCCATGAGAA------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y V C R C D N E K F K D L K M H K T A C P C R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q S P E E A L D L F D Q M L D G A F T E G E V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V R L K T D L S H P D P A M R D Y P L F R V L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S T P H Q R V D A I V Y P L M N L S V A V D D H
- - - - - - - - - - - - - L M N L S V A V D D H
---------------------------------------TACCGCCACGGAGAGGTTCATGAGCGGGTATAC
289290291292293294295296297298299300301302303304305306307308309310311312
L L G M T H V I R G K D H I A N T K R Q E F I F
- - - - - H V I R G K D H I A N T K R Q E F I F
---------------CTGGTGAGGAGTGGACGTGAGAACCCGGAATAGCGGATAATCACGCATGGCCGGGTC
313314315316317318319320321322323324325326327328329330331332333334335336
R Y M G W E T P V Y R H Y G R M G I E G V V L S
R Y M - - - - P V Y R H Y - - - - - - - - V L S
AGGATGAGA------------TAACCTGACCCCAACCTC------------------------CATCTGGTC
337338339340341342343344345346347348349350351352353354355356357358359360
T S Q M R A G I Q S G E Y S G W D D V R L G T L
T S - - - - - - - - - - - - - - - - - - - - - -
AAAGAG------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A M A R R G I Q P Q A V R N A V V E I G I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T D I Q F S W E N L Y A K N K E I I D S Q A D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F F F V P D P V L V P V S G S D P V V A K A M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y P G D E S R G Y R E I P F A G S L Y L P K A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L E S G A A Y I R L K D L F N I K V L Y E G D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I R G E Y A G D D L Q E A R S K K A P I I Q W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P E N H A N P C T L K T P D G D V S G V C E P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A V T T Q D R I V Q F E R V G F A R I D A A G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561
P A V A Y F T H R
- - - - - - - - -
---------------------------
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_glu_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E E K I L P I A L R N A I K Y N G K A N P K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V L G I F L S E N P E Y R S K A K E V M P I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K V V E E V N K L S L D E I K K K L E E L G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V K K K E K K E K G L E L P N V K D K V V M R F
- - - - - - - - - - - - - - - - - - - - V M R F
------------------------------------------------------------AACTATGTTAAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A P N P S G P L H I G H A R A A V L N D Y F V K
A P N P S G P L H I G H A R A A V L N D Y F V K
TAACTCCATCAATCTATACATCTTATTCTCTTCCAACTCATCTCCAACAACATAAACCTCTCCATCAAATAT
121122123124125126127128129130131132133134135136137138139140141142143144
K Y G G K L I L R L E D T D P K R V L P E A Y D
K - - - K L I L R L E D T D - - - - - P E A Y D
TAA---------TCCAAATTCTGGTCTATCTGGATGCATTCT---------------TTTCTCTGCCCCTTC
145146147148149150151152153154155156157158159160161162163164165166167168
M I K E D L D W L G V K V D E V V I Q S D R I E
M I K E D L D W L . . . . D - V V I Q S D - - -
GATAATAAGTTTCTTTGGATTCCAGAC------------CCT---ATCTTTATCAATAAGCTC---------
169170171172173174175176177178179180181182183184185186187188189190191192
L Y Y E Y G R K L I E M G H A Y V C D C N P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F R E L R N K G V P C K C R D R A I E D N L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
W E K M L N G E L E N V A V R L K T D I K H K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P S I R D F P I F R V E K T P H P R T G D K Y C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V Y P L M N F S V P V D D H L L G M T H V L R G
- - - L M N F S V P V D D H - - - - - H V L R G
---------TCTCAAAACATGAGTCATTCCTAAAAGATGATC---------------GAAGTTCATTAAAGG
289290291292293294295296297298299300301302303304305306307308309310311312
K D H I V N T E K Q A Y I Y K Y F G W E M P E F
K D H I V N T E K Q A Y I Y K Y F - - - - P E F
ATATACACAGTATTTATCTCCAGTTCTTGGATGTGGAGTTTTTTCAACTCT------------GTCCCTAAT
313314315316317318319320321322323324325326327328329330331332333334335336
I H Y G I L K I E D I V L S T S S M Y K G I K E
I H Y - - - - - - - - V L S T S - - - - - - - -
TGATGGGTT------------------------TCTAACAGCTACATT------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G L Y S G W D D V R L G T L R A L R R R G I K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E A I Y E I M K R I G I K Q A D V K F S W E N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y A I N K E L I D K D A R R F F F V W N P K K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I I E G A E K K V L K L R M H P D R P E F G E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E L I F D G E V Y V V G D E L E E N K M Y R L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E L F N I V V E K V D D I A L A K Y H S D D F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I A R K N K A K I I H W I P V K D S V K V K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
M P D G E I K E G F A E K D F A K V E V D D I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Q F E R F G F V R I D K K D N D G F V C C Y A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553
R
-
---
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_glu_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E E K E L R D L V R R Y A L E N A A R Y G G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A N P N A V M K K I M K E H E E L R P R A K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L K T V R E V V R E V N K M S G E E I R R E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L G G P R E D V A R D K E G L K P L P G A E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G N V R L R F A P N P S G P L H I G H A R A A V
- - - R L R F A P N P S G P L H I G H A R A A V
---------CATCAGCCGAACTACGTCGCCCTCCCACAGGTCTTCTGCGTCTTCACCGTCCAACAGTGCTCG
121122123124125126127128129130131132133134135136137138139140141142143144
L N D E Y A R R Y D G T L V L R I E D T D P R R
L N D E Y A R R - - - T L V L R I E D T D - - -
GGCCACGCCGTTCTCAGGATGTAG---------CCTCTCTCCCTCATCCCGATCGGGGTGTAG---------
145146147148149150151152153154155156157158159160161162163164165166167168
V D P E A Y D M I E E D L E W L G V N I D E R Y
- - P E A Y D M I E E D L E W L . . . . D - R Y
------GACCGACTCCTTCATCCCTTCGATCCGTAATTCGACAGGATC------------GTA---GTGAGA
169170171172173174175176177178179180181182183184185186187188189190191192
V Q S N R I E L Y Y M V C E E L L E R E G A Y V
V Q S N - - - - - - - - - - - - - - - - - - - -
CTCAGGGTCGAT------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C T C D P D E F R R L R D V G R A C P C R S R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E E N L E L W E E M L D G T F S E G E A V V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V K T E V D H P D P A V R E W I A F R I V E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H P M T G S R Y L V W P T M N F A V A V D D H L
- - - - - - - - - - - - T M N F A V A V D D H -
------------------------------------ACGAAGTACGTGCGTGATGTTCATGAGATGGTC---
289290291292293294295296297298299300301302303304305306307308309310311312
M N I T H V L R G K D H E S N T R R Q K Y V F E
- - - - H V L R G K D H E S N T R R Q K Y V F E
------------GAAGTTCATCGTCGGCCACACAAGGTACCGAGAACCCGTCATCGGGTGCTCTTCTTCGAC
313314315316317318319320321322323324325326327328329330331332333334335336
H L G W D T P E Y V H Y G I L K V E G A V L S T
H L - - - - P E Y V H Y - - - - - - - - V L S T
GATCCT------------CTCCCTCACCGCGGGATC------------------------ACGTACGACGGC
337338339340341342343344345346347348349350351352353354355356357358359360
S E I R R G I D S G E Y T G W D D V R V A T L R
S - - - - - - - - - - - - - - - - - - - - - - -
TTC---------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A L R R R G I K P E A I R E T I L E I G L T D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D A T F S W E H L Y A R N R K M I D P E S H R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F F V R D P V E L R I E G M K E S V L A R L P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
H P D R D E G E R V L I L H P E N G V A R A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D G E D A E D L W E G D V V R L M N A V N V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E E V G D G W L R G R Y H S D D Y R I A K E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A Q I V H W V P P D Q A V R C E V V R P D G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E S G Y A E I N V E R E Q A G S T V Q F E R L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571
F V R L E E V S S G G V R A V Y A H D
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_glu_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V P V E D L V Y R Y A L L N A V K H R G R A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P G A V M G A V M S N E P E L R K M A P Q V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A V E A A V E R V N S L S P E E Q Q Q E M E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G L E I T E R K Q K K R K G L R E L A G V K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V V L R F A P N P S G P L H I G H A R A A I L N
- - L R F A P N P S G P L H I G H A R A A I L N
------CTCAGGTTCGCCCCCAACCCCAGCGGACCCCTCCACATAGGCCATGCAAGGGCCGCGATCCTCAAC
121122123124125126127128129130131132133134135136137138139140141142143144
H E Y A R K Y D G R L I L R I E D T D P R R V D
H E Y A R K - - - R L I L R I E D T D - - - - -
CATGAATATGCAAGGAAA---------AGGCTCATCCTCAGGATAGAGGACACGGAC---------------
145146147148149150151152153154155156157158159160161162163164165166167168
P E A Y D M I P A D L E W L G V E W D E T V I Q
P E A Y D M I P A D L E W L . . . . D - T V I Q
CCGGAGGCCTACGATATGATTCCAGCCGACCTTGAGTGGCTG------------GAT---ACAGTTATCCAG
169170171172173174175176177178179180181182183184185186187188189190191192
S D R M E T Y Y E Y T E K L I E R G G A Y V C T
S D - - - - - - - - - - - - - - - - - - - - - -
AGCGAC------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C R P E E F R E L K N R G E A C H C R S L G F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E N L Q R W R E M F E M K E G S A V V R V K T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L N H P N P A I R D W V S M R I V E A E H P R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G T R Y R V Y P M M N F S V A V D D H L L G V T
- - - - - - - - M M N F S V A V D D H - - - - -
------------------------ATGATGAACTTCTCAGTGGCGGTTGATGACCAC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
H V L R G K D H L A N R E K Q E Y L Y R H L G W
H V L R G K D H L A N R E K Q E Y L Y R H L - -
CACGTCCTGAGGGGTAAGGACCACCTGGCAAACAGAGAGAAGCAGGAGTACCTCTACAGGCACCTT------
313314315316317318319320321322323324325326327328329330331332333334335336
E P P E F I H Y G R L K M D D V A L S T S G A R
- - P E F I H Y - - - - - - - V . L S T S - - -
------CCCGAATTCATACACTAC---------------------GTT---CTCAGCACCTCG---------
337338339340341342343344345346347348349350351352353354355356357358359360
E G I L R G E Y S G W D D P R L G T L R A I A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R G I R P E A I R K L M V E I G V K I A D S T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S W K K I Y G L N R S I L E E E A R R Y F F A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D P V K L E V V G L P G P V R V E R P L H P D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P E I G N R V L E L R G E V Y L P G D D L G E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P L R L I D A V N V I Y S G G E L R Y H S E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E E A R E L G A S M I H W V P A E S A L E A E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I M P D A S R V R G V I E A D A S E L E V D D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V Q L E R F G F A R L D S A G P G M V F Y Y A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553
K
-
---
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_glu_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N V E E I A F K Y A L A N A V K Y G G K A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A V M A K L M A E V P E L R A R A R E V K Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V D A V V A R V N S M P L E E Q R R I L R E R W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E L L E E R R A E Q R R P G L E G L P E L P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V R G G V V V R F A P N P D F V L H L G S A R P
- - - - - V V R F A P N P D F V L H L G S A R P
---------------GTAGTGCGCTTCGCCCCCAATCCCGACTTTGTTTTACACTTAGGCAGTGCGCGGCCT
121122123124125126127128129130131132133134135136137138139140141142143144
A I L N Y A Y R I K Y G G K F I L R F E D T D P
A I L N Y A Y R I K - - - K F I L R F E D T D -
GCTATTTTAAACTACGCCTATAGGATTAAA---------AAGTTCATATTGCGGTTTGAAGACACAGAT---
145146147148149150151152153154155156157158159160161162163164165166167168
R I K S P L V T E E V N A Y E S I R E D L R W L
- - - - P . . . . . . N A Y E S I R E D L R W L
------------CCG------------------AACGCCTATGAATCCATTAGGGAGGACTTAAGGTGGCTG
169170171172173174175176177178179180181182183184185186187188189190191192
G V R W D E E Y I Q S Q R M E I Y Y E H A K K L
. . . . D E - Y I Q S Q - - - - - - - - - - - -
------------GACGAG---TATATACAGTCCCAA------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L E M G A A Y V D L C K P E E W R R L R N E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A C P H R E Q P P E V N L E L W D K M L E G R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E G E A V L R I K T D L T H P D P S V R D W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A F R I I D T S K T P H P L T G D K Y I V W P T
- - - - - - - - - - - - - - - - - - - - - - - T
---------------------------------------------------------------------ACT
289290291292293294295296297298299300301302303304305306307308309310311312
Y N F A V S I D D H L M G V T H V L R A Q E H S
Y N F A V S I D D H - - - - - H V L R A Q E H S
TATAACTTCGCGGTTTCTATAGATGACCAC---------------CACGTGTTGAGAGCACAGGAACACAGC
313314315316317318319320321322323324325326327328329330331332333334335336
V N T I K Q S Y V F R H F G W E Q P V T I H F G
V N T I K Q S Y V F R H F - - - - P V T I H F -
GTTAATACCATTAAACAGTCATACGTATTTAGACACTTC------------CCGGTCACTATCCACTTC---
337338339340341342343344345346347348349350351352353354355356357358359360
R L R I E G A T L S K S K L K A M R I K Y D D L
- - - - - - - T L S K S - - - - - - - - - - - -
---------------------ACTCTGAGTAAGTCT------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L P T L A G L R N R G I V P E A I W D L I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V G I K P S D S T V A L A N L F A F N R K H I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P I A D R Y M Y V A D P V K L V F E A D K E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A H V P F H P S F K E R G E R T Y R L G P G R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E V Y I Q R R D A V A G K V V R L M E L A N V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I V R V E G D V A Y G R I H S Y S L D E A K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G A P I I Q W V W D P V E I T V I K P A G V G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K E V E V G L G E G W L E R V E V G K Y V Q F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570
R Y G Y L K K R G P R E F V F L H D
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_glu_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K Y N P D E L R E L A R A Y A L V N A V E H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G R A A V G P V M G K I M A E K P E L R P H A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E I V A I V R E V V A E V N K L S L D E Q K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L E E K Y S W V L E K L S K P K E Q E K T L P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P G A E E G K I V T R F A P N P D F V I H L G
- - - - - - - - - V T R F A P N P D F V I H L G
---------------------------AGCCTCCATGAGCCTTACAATACTGCCTTTCTTTAGTAGCTTCTT
121122123124125126127128129130131132133134135136137138139140141142143144
N A R P A I L S Y E Y K V I Y K G K M I L R F E
N A R P A I L S Y E Y K V I - - - K M I L R F E
ATCGCTCTGCGATATATAGACTGTTGCTGTTGGTCCTTCTAG---------TCTTGAACCTAGTTTGCCCGA
145146147148149150151152153154155156157158159160161162163164165166167168
D T D P R T K T P L P E A Y E L I K Q D L E W L
D T D - - - - - - - P E A Y E L I K Q D L E W L
CGGATGATA---------------------CTCCCATGGCAAGTTTTCTATAATCATTGGCGTCGGCGGTAT
169170171172173174175176177178179180181182183184185186187188189190191192
G I R W D E E Y I Q S L R M P I Y Y Q I I K E L
. . . . D E - Y I Q S L - - - - - - - - - - - -
------------TCTACG---TGTGGGGTCTACTAT------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L E K G H A Y V D D K P G E E F R K Y R N S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L S E Y P P R L R T A E E N L E L W D Q M L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R F A E G E A V V R I K T D P N H P D P S V R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W V A F R I I D T S R Y P H P L V G D R Y I V W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P T Y N F A A G V D D W L M G V T H I L R A K E
- T Y N F A A G V D D W - - - - - H I L R A K E
---ACCCATTAGCCAGTCATCAACGCCGGCTGCGAA---------------GACGATGTAGCGATCGCCGAC
313314315316317318319320321322323324325326327328329330331332333334335336
H M Q N T I K Q K Y V Y E Y M G W K Y P H V V H
H M Q N T I K Q K Y V Y E Y M - - - - P H V V H
TAGCGGGTGAGGATAGCGGCTTGTATCGATTATCCGGAATGCTAC------------GCTCGGGTCTGGGTG
337338339340341342343344345346347348349350351352353354355356357358359360
F G R L K L E G F I M S K S A L K Q L L D Q G V
F - - - - - - - - I M S K S - - - - - - - - - -
ATT------------------------TGCCTCGCCCTCGGC------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S S G I D D P R F A T I A G L R R R G I T A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I R K L I L D V G V K Y T D A S I S Y T N L A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T N R V I V D P T A R R I M A A I P P T P M I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E N L P W E K R E F E I P Y H P S G K L G S R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I S L E G P T A T V Y I S Q S D K K L L K K G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I V R L M E A F N V E I V D I E G D K I R A R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H S L G L E D A R K H R A L I I Q W I P G D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L Q I E L L V P E G L D L I Q R R G I V E Q A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A E L K Q G D I V Q L V R I G F A R V D A L E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591
E D G S V R K V V M V F A H E
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/glu_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K Y V V Q N A A K Y G K A N E K A V M G K V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A E N P E L R K K A K E V L E M V R E C I N E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A L S E E K K R E L I Q K Y S A E G E A K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S E T R G L P E L E G A E K G K V V M R F A P N
- - - - - - - - - - - - - - - - - V M R F A P N
---------------------------------------------------CAGCCTTACAACCTGCCCTTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P N G P P T L G S A R G I I V N G E Y A R M Y E
P N G P P T L G S A R G I I V N G E Y A R M - -
CAACCTCTCGAAGTCGTCTTTTGTAACATATATAGTTCTTTCACCTTTCAGCCTTCTCTTCTCGCC------
121122123124125126127128129130131132133134135136137138139140141142143144
G K Y I I R F D D T D P R T K R P M L E A Y D W
- K Y I I R F D D T D - - - - - P . . E A Y D W
---ATTCAGCGGGAGCTCGACCTCTTTCTTCTC---------------TTC------CACGGGCCCCCAAAT
145146147148149150151152153154155156157158159160161162163164165166167168
Y L E D I E W L G Y K P D E V I Y A S K R I P I
Y L E D I E W L . . . . D - V I Y A S K - - - -
GAAAAAGTAACGGTTTGCCTTGCG------------CCT---CTCAGCGTAAAGATTCTT------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y Y D Y A R K L I E M G K A Y T C F C S Q A E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K K F R D S G E E C P H R N I S V E D A L E V W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E R M L E G D Y E E G E V V L R I K T D M K H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D P A I R D W V A F R I I K E V H P L V G D K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V V Y P T L D F E S A I E D H L L G V T H I I R
- - - - T L D F E S A I E D H - - - - - H I I R
------------GTGGTCCTCAATCGCGGACTCAAAATCGAGTGT---------------CTTGTCCCCAAC
289290291292293294295296297298299300301302303304305306307308309310311312
G K D L I D S E R R Q R Y I Y E Y F G W V Y P I
G K D L I D S E R R Q R Y I Y E Y F - - - - P I
GAGAGGATGCACCTCCTTTATTATTCTGAACGCCACCCAGTCCCTTATCGCCGG------------CATGTC
313314315316317318319320321322323324325326327328329330331332333334335336
T K H W G R V K I F E F G K L S T S S I K K D I
T K H W - - - - - - - - - K L S T S - - - - - -
CGTCTTGATTCT---------------------------CCCCTCAAGCATTCT------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E R G K Y E G W D D P R L P T L R A F R R R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E P E A I K S F F L S L G V G E N D V S V S L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N L Y A E N R K I I D R K A N R Y F F I W G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I E I V N L P E K K E V E L P L N P H T G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R R L K G E R T I Y V T K D D F E R L K G Q V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R L K D F C N V L L D E K A E F M G F E L E G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K G K N I I H W L P E S E A I K G K V I G E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E A E G L V E R N A V R D V G K V V Q F E R F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546
F C K V E S A D E E L V A V Y T H P
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_glu_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L N A V E H G G R A A V G P V M G K I M A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P D L R A H A R E I A G I V R E I V A E V N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L E E Q K R L L E E H Y S W V K E R L A K P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E Q E R G L P P L P G A E E G K V V T R F A P N
- - - - - - - - - - - - - - - - - V T R F A P N
---------------------------------------------------GTAACACGCTTCGCCCCTAAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P D F I I H L G N A R P A I L S Y E Y K V M Y K
P D F I I H L G N A R P A I L S Y E Y K V M - -
CCGGACTTCATAATACACTTGGGCAACGCTAGACCAGCAATACTGAGCTACGAGTACAAGGTCATG------
121122123124125126127128129130131132133134135136137138139140141142143144
G R M I L R F E D T D P R T K T P L P E A Y E L
- R M I L R F E D T D - - - - - - - P E A Y E L
---AGGATGATTCTCCGCTTCGAGGATACAGAT---------------------CCGGAGGCCTACGAGCTC
145146147148149150151152153154155156157158159160161162163164165166167168
I K Q D L K W L G V R W D E E Y I Q S L R I P I
I K Q D L K W L . . . . D E - Y I Q S L - - - -
ATAAAGCAGGATCTCAAGTGGCTC------------GACGAG---TACATACAGAGCCTG------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y Y Q V A R Q L L E K G H A Y V D D R P A E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R R Y R D A G K L A E Y P P R L R A P E E N L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L W D R M L E G W L S E G E A V V R I K T D P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H P D P S V R D W V A L R I I D T S R H P H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V G D R Y V V W P T Y N L A A A V D D H M M G V
- - - - - - - - - T Y N L A A A V D D H - - - -
---------------------------ACTTACAACCTGGCAGCGGCAGTAGATGACCAC------------
289290291292293294295296297298299300301302303304305306307308309310311312
T H I L R A K E H M Q N T I K Q K Y I Y G Y M G
- H I L R A K E H M Q N T I K Q K Y I Y G Y M -
---CACATACTGAGGGCCAAGGAGCATATGCAGAACACTATCAAGCAGAAATACATATACGGCTACATG---
313314315316317318319320321322323324325326327328329330331332333334335336
W K Y P N V I H F G R L K L E G F I M S K S T L
- - - P N V I H F - - - - - - - - I M S K S - -
---------CCGAACGTCATTCACTTT------------------------ATAATGAGCAAGTCT------
337338339340341342343344345346347348349350351352353354355356357358359360
K R L L D Q G I G A G L D D P R F A T I A G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R R G I T A E A I R R V I L D V G V K Y T D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I S Y A N L A A V N R A I V D P A A R R I M A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I P P L P L V V N D I P W E E R W L E I P Y H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S G K L G S R R I L V K G P S T T I Y V S R S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R G L L E P G R V V R L M E A F N I E V V D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E S R V V A R F H S M G L E E A R K H Q A P I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q W V P G D A A L Q L E L L V P E G L D L V Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R G L V E A A A A E L R P G E V V Q L V R M G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575
A R V D A L E T E D G S A R K I V A I F A H E
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_glu_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S N D I R N L V Y K Y A L H N A Y T H N G K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N V N A V V S K I F A E R P E L R S K A K D I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E I A K E L V N Y V N S L D V E S Q K K E L E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K F P E M L E E K K R E K E S K K E L P D I P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S G V L V T R F A P N P D G P L H L G N A R A A
- - - - V T R F A P N P D G P L H L G N A R A A
------------GTGACTCGTTTTGCTCCTAATCCCGATGGTCCTCTTCACCTTGGAAACGCTAGAGCAGCT
121122123124125126127128129130131132133134135136137138139140141142143144
I I S H E Y A R I Y N G K F I L R F D D T D P K
I I S H E Y A R I - - - K F I L R F D D T D - -
ATAATATCTCATGAATACGCTAGAATA---------AAATTTATACTTCGATTTGATGACACTGAT------
145146147148149150151152153154155156157158159160161162163164165166167168
T K K P I P E A Y D W I K E D L K W L G I K W D
- - - - - P E A Y D W I K E D L K W L . . . . D
---------------CCTGAGGCTTATGATTGGATAAAAGAAGACCTGAAATGGCTA------------GAC
169170171172173174175176177178179180181182183184185186187188189190191192
L E V R A S A R L E T Y Y N F A R I L L S K G Y
- E V R A S A - - - - - - - - - - - - - - - - -
---GAAGTAAGAGCCTCAGCA---------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A Y I D L C K E A E F K E R R S K R E A C P H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E T S P E S N L E L F E K M I H G E F E E G K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V R L K T D L K L P D P S Q R D W V L L R V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N V K K S P H P I E G D K Y W V W P T Y N F A S
- - - - - - - - - - - - - - - - - - T Y N F A S
------------------------------------------------------ACATATAATTTTGCAAGC
289290291292293294295296297298299300301302303304305306307308309310311312
A I D D Y D L G V T H I F R G K E H A V N A G K
A I D D Y - - - - - H I F R G K E H A V N A G K
GCTATTGATGATTAC---------------CACATTTTCAGAGGAAAGGAGCATGCTGTTAATGCAGGAAAA
313314315316317318319320321322323324325326327328329330331332333334335336
Q K W I Y N Y M G W K Y P Y V R E F G R L K L E
Q K W I Y N Y M - - - - P Y V R E F - - - - - -
CAGAAATGGATCTATAACTATATG------------CCTTACGTTAGGGAATTT------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G F M M S K S K I R T V V E K G V S I D D P R L
- - M M S K S - - - - - - - - - - - - - - - - -
------ATGATGAGTAAATCA---------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P T L A G L R R R G I L S D T I K E I I I T V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L K E T D A T I S F D N L A S T N R K K L D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A K R L M F V E S P M E F T I D I P Q P M L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I P Y H P S N P N E Y R E I G V N P G D I I L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N K D D A K D K V L R L M E L C N V T V N E D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L V Y N S K G I E D A K K L G M K I I Q W V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D E S V P V V I L R P D P E K G I E T I N G V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E S V I R S L N K G E I V Q F I R Y G F V K V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567
E I S T D G Q V T V I F S H E
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Archaea/Staphylothermus marinus/Smarinus_glu_aa
Archaea/Staphylothermus marinus/Smarinus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L N A Y K H S G K A E L K P V I S K I I A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P E I R R H V R E V I D I V R E T I N E V N Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P I E K Q K E I I E K N W P E L L E E K P R T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E K S L P P L P N A A K G R V V T R F A P N P D
- - - - - - - - - - - - - - - V T R F A P N P D
---------------------------------------------GTAACAAGATTCGCTCCTAATCCAGAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y T I H L G N A R P A L L S Y W Y A E M Y E G K
Y T I H L G N A R P A L L S Y W Y A E M - - - K
TATACTATCCATTTGGGAAATGCTAGGCCCGCACTTCTCAGTTATTGGTATGCTGAAATG---------AAA
121122123124125126127128129130131132133134135136137138139140141142143144
M I L R F E D T D P R T K A P F P E A Y D R I R
M I L R F E D T D - - - - - - - P E A Y D R I R
ATGATTCTAAGATTCGAAGACACCGAT---------------------CCAGAAGCATATGATAGGATAAGA
145146147148149150151152153154155156157158159160161162163164165166167168
N D L K W L G I K W N E E Y I Q S L R L P I L Y
N D L K W L . . . . N E - Y I Q S L - - - - - -
AATGATCTTAAATGGCTA------------AACGAA---TATATTCAAAGTCTA------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N A L R E L I K H G G A Y V D K C S P K E F K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L R D S G K P C P H R E L P P E K H L E E L D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I F E G Y Y S E G E A V V R V K T D L S H P D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S V R D W V A A R I I D T S K T P H P I V G D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y I L W P T Y N L A A A I D D H L M G V T H I L
- - - - - T Y N L A A A I D D H - - - - - H I L
---------------ACATATAATCTAGCTGCTGCAATAGATGATCAC---------------CATATACTT
289290291292293294295296297298299300301302303304305306307308309310311312
R A K E H V S N T I K Q K F L Y D H M G W K Y P
R A K E H V S N T I K Q K F L Y D H M - - - - P
AGAGCTAAAGAACATGTTTCAAATACTATTAAACAAAAATTCCTATATGATCATATG------------CCG
313314315316317318319320321322323324325326327328329330331332333334335336
E T I H F G R L S L E G V I L S K S R M R K M I
E T I H F - - - - - - - - I L S K S - - - - - -
GAAACAATACATTTT------------------------ATTTTGAGTAAGTCT------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V E Y N M E P Y D D P R F G T L S G L R R R G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V R E T L W R I I K D V G I N V I D A R I S Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N L A A I N R S I I D P Q A K R Y M A I E E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P L K L I G F N N S I E A H V L R H P S T R E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y N Y I I K P G D I V Y I S Q K D F N I I Q N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M F R L M G I G N F A L T R P V F S K N Y I G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E A R L I S L S A K E A K Q Y R A P I I Q W V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L E Q S I R V K L I I P K E T N L E T R I L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E K A L T N E E L G N I V Q F Y R I G F A R I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566
S K E P E E I K C I F A H E
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_glu_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M M Y E D D I R R I A L I N A Y Q H E G K A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K S V M G K V M A E I P D L R R D P R S A R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M V S R I V D E V N S M S A Y E I R E T V E T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y T S S I R K E K K V E E H R L P D L E G V N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P V V M R M A P S P S G P L H I G H T R M A I L
- - V M R M A P S P S G P L H I G H T R M A I L
------GTAATGAGGATGGCCCCATCTCCGTCCGGACCACTGCATATTGGCCACACCAGGATGGCAATACTC
121122123124125126127128129130131132133134135136137138139140141142143144
N D E Y V K R Y G G E L I L R I E D T N P K N I
N D E Y V K R - - - E L I L R I E D T N - - - -
AACGACGAGTATGTCAAAAGG---------GAACTGATTCTCAGGATAGAGGATACAAAT------------
145146147148149150151152153154155156157158159160161162163164165166167168
D P D A Y H M I P E D L E W L G V N V T K I V I
- P D A Y H M I P E D L E W L . . . . T - I V I
---CCAGATGCATATCATATGATACCGGAGGATCTTGAATGGCTT------------ACG---ATCGTTATA
169170171172173174175176177178179180181182183184185186187188189190191192
Q S D R F D L Y Y A E A K K L M E N G H M Y V C
Q S D - - - - - - - - - - - - - - - - - - - - -
CAGAGTGAC---------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T C P R E E F K K R K L E S I P C K D R D N P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E T N L E L F D K M I D G T I K E G D A V A V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K T D L K H P N P S V R D W I A F R I I E A R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P R V D D K Y R V Y P M M S F S V A V D D H Y L
- - - - - - - - - - - M M S F S V A V D D H - -
---------------------------------ATGATGAGCTTCAGCGTTGCCGTGGACGACCAT------
289290291292293294295296297298299300301302303304305306307308309310311312
G L T H V L R G K D Q L T N T D K Q R Y I F D Y
- - - H V L R G K D Q L T N T D K Q R Y I F D Y
---------CATGTCCTTAGAGGAAAGGATCAGCTCACAAACACCGACAAACAGAGGTACATTTTCGATTAC
313314315316317318319320321322323324325326327328329330331332333334335336
N G W K K P Y Y Y H Y G M I K F P G I K L K T S
N - - - - P Y Y Y H Y - - - - - - - - K L K T S
AAT------------CCATACTATTACCATTAT------------------------AAGCTGAAAACATCT
337338339340341342343344345346347348349350351352353354355356357358359360
L M K K G I L S G Q Y E G W S D I R L G T V R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F A K R G Y R P E T F R R Y W I N S G L R E I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A I F S I E I F D S I N R E I V D P R A Y R F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F V K D P V P V R I E G M P N I S A K L P L H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T H P E Y G F R E Y E V K G S V Y I A S R D F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A I S E G E R I R L K D L C Y I R K K G N G I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y D G V E M T E K T K I I N W C P E G S R D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V L K P D G S K D S G L I E P K S S G Y R G I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550
Q L E R Y G Y V N F A D G D D L A Y F T H P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_glu_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y E E E I K K I A L L N A Y Q H N G K A E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V I G K V M A E I A D L R K N P K L V S E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K A A V D S V N S M S K D D I V N I V E K Q F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A L K K D K K P E E H R L P D L Q G V N G H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V M R L A P S P S G P L H I G H T R M A I L N D
V M R L A P S P S G P L H I G H T R M A I L N D
GTTATGAGGCTTGCACCGTCTCCATCAGGGCCTCTCCACATAGGCCATACCAGGATGGCTATTCTTAACGAC
121122123124125126127128129130131132133134135136137138139140141142143144
E Y V K R Y G G D L I L R I E D T N P T N I D P
E Y V K R - - - D L I L R I E D T N - - - - - P
GAATATGTCAAAAGA---------GACCTTATACTTCGTATAGAAGACACAAAT---------------CCA
145146147148149150151152153154155156157158159160161162163164165166167168
E A Y A M I P E D L E W L G V N V T K T V I Q S
E A Y A M I P E D L E W L . . . . T - T V I Q S
GAAGCTTATGCTATGATTCCAGAGGATCTAGAGTGGCTA------------ACG---ACAGTAATACAGAGT
169170171172173174175176177178179180181182183184185186187188189190191192
E R F D L Y Y S V A K K L I E N G H L Y I C T C
E - - - - - - - - - - - - - - - - - - - - - - -
GAA---------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D R E E F K R K K L A S I P C K D R D N P P E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N L Y L F E K M L D G E I K A G A A V A V M K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D L N H P N P S V R D W I A F R I I D A K H P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T G D K Y R V F P M M S F S V A V D D H Y L G L
- - - - - - - - - M M S F S V A V D D H - - - -
---------------------------ATGATGAGTTTCAGCGTGGCAGTTGATGATCAT------------
289290291292293294295296297298299300301302303304305306307308309310311312
T H V L R G K D Q L T N T E K Q R Y V F E Y N G
- H V L R G K D Q L T N T E K Q R Y V F E Y N -
---CATGTACTCAGGGGCAAGGATCAGTTGACGAACACTGAAAAGCAGAGGTATGTCTTCGAATACAAT---
313314315316317318319320321322323324325326327328329330331332333334335336
W N K P Y Y Y H Y G M I R F P G T R L K T S L M
- - - P Y Y Y H Y - - - - - - - - R L K T S - -
---------CCATATTATTACCATTAT------------------------AGACTTAAAACCTCC------
337338339340341342343344345346347348349350351352353354355356357358359360
K K G I Q A G Q Y D G W S D V R L G T V R A M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R R G Y Q P E T F R R Y W I N S G L R E I D A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F S W E I F N S L N R E F V D P K A Y R F S F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K D P V E I K M E G S N G L T A R L P Y H P S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P E Y G V R K Y E I G D T V Y I S K G D A D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A D G E R F R L K D L C Y V V R K G D R F L F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G T E M K E K T K I I N W C P P N S R E F Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K P D G S I D K G L I E P A S K G Y R G I S Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548
E R Y G Y V N F Y D S D E K A Y F T H D
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_glu_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D D E I R E R V R R E A E V A A L F N A L K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D S D A Q V G A I M G P M M G E N P E F R E H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D E I P G V V S P V I A D V N G M D R E E K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R L G E L A P E R L E E L D A E D E E D D Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P D L P N A E A Y D E I R M R C A P N P N G P W
- - - - - - - - - - - - - M R C A P N P N G P W
---------------------------------------ATGCGGTGTGCGCCGAACCCGAACGGCCCGTGG
121122123124125126127128129130131132133134135136137138139140141142143144
H I G H S R M P A V I G T Y A E E Y D G E F I V
H I G H S R M P A V I G T Y A E E - - - E F I V
CACATCGGCCACTCGCGGATGCCGGCGGTCATCGGGACGTACGCCGAGGAG---------GAGTTCATCGTG
145146147148149150151152153154155156157158159160161162163164165166167168
R F D D T D P E T K R P L L W A Y D E I L D E I
R F D D T D - - - - - P . . W A Y D E I L D E I
CGCTTCGACGACACCGAC---------------CCG------TGGGCGTACGACGAGATTCTCGACGAGATA
169170171172173174175176177178179180181182183184185186187188189190191192
G Y L G F E P A D V Y R A S D R L D V Y Y E H A
G Y L . . . . A - V Y R A S D - - - - - - - - -
GGGTACCTC------------GCC---GTGTACCGCGCCAGCGAC---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R Q L I G M G G A Y T C S C P A G E F S E L K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G G E A C P H R E K D P A V V A E E F D A M V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G D Y N S G E M V L R V K T D I E H K N P A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D W V A F R I I E T P H P R E E A A A Y R C W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M L D F Q S G V D D H L T G V T H I I R G I D L
M L D F Q S G V D D H - - - - - H I I R G I D L
ATGCTGGACTTCCAGTCGGGCGTCGACGACCAC---------------CACATCATCCGCGGCATCGACCTG
313314315316317318319320321322323324325326327328329330331332333334335336
Q D S A K R Q Q F V Y D Y F D W E Y P E V I H W
Q D S A K R Q Q F V Y D Y F - - - - P E V I H W
CAGGACTCCGCGAAGCGCCAGCAGTTCGTCTACGACTACTTC------------CCCGAGGTCATCCACTGG
337338339340341342343344345346347348349350351352353354355356357358359360
G H V Q V D A Y D V K M S T S T I G E L I D A G
- - - - - - - - - - K M S T S - - - - - - - - -
------------------------------AAGATGTCGACGTCC---------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E L D G W D D P R A P T L P S V Q R R G I R G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A L V D A M T E L G T S T S N V D L A M S S V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S N N R D L V D D E A P R Q F F V R D G F D D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G S G A E E Q F D A T E V P L S G G P D S A H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L V H P D H E D R G E R N I P V G D A V L V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R D L P A A G D R L W L K G Y G P V E F D G D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F D Y L D E A D I D V V R E E G V D V V H W V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A T E N V R V R M R T P N G D V S G Y A E P G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S D V D P D A V V Q F V R V G F A R C D R H D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586
A E S V A Y Y A H P
- - - - - - - - - -
------------------------------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_glu_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E T Q T H K I E G P V R V R F A P S P T G F L
- - - - - - - - - - - - R V R F A P S P T G F L
------------------------------------CGCGTGCGCTTCGCCCCGAGCCCGACGGGCTTTCTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H I G G L R T A L Y N F L F A R K H G G Q F I L
H I G G L R T A L Y N F L F A R K - - - Q F I L
CACATCGGTGGGTTGCGGACGGCGCTCTACAACTTCCTGTTTGCCCGTAAG---------CAGTTCATCCTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R I E D T D Q E R Y V P G A E E D I I E S L R W
R I E D T D - - - - - P G A E E D I I E S L R W
CGCATCGAAGATACCGAC---------------CCCGGCGCCGAGGAGGACATCATCGAATCGTTGCGCTGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A G L T Y D E G P D V G G P C G P Y R Q S E R K
A . . . . D - - - - - - - - - G P Y R Q S E - -
GCC------------GAC---------------------------GGGCCGTACCGCCAGTCGGAG------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L Y L Q Y A K Q L V E A G H A Y Y A F D T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L E E M R R R L Q K S G N P S P K Y D A I T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M S M R N S L T L P A E E V E R L L A E G V P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V I R L K V P R R E T I R F Y D L I R G W V S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S S E I D D Q V L I K S D G M P T Y H M A N V
- - - - - - - - - - - - - - - - - T Y H M A N V
---------------------------------------------------ACCTACCACATGGCCAACGTG
217218219220221222223224225226227228229230231232233234235236237238239240
V D D H L M G I T H V I R G E E W L S S T P K H
V D D H - - - - - H V I R G E E W L S S T P K H
GTCGATGACCAC---------------CACGTGATCCGGGGCGAGGAATGGCTTTCTTCGACGCCCAAGCAC
241242243244245246247248249250251252253254255256257258259260261262263264
V L L Y R Y L G W E M P Q M A H L P L I L S P K
V L L Y R Y L - - - - P Q M A H L - - - - - - -
GTGCTGCTGTACCGGTACCTG------------CCGCAGATGGCACACCTG---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G G K L S K R N A D A L G I P V L V R Q Y R E L
- - K L S K R - - - - - - - - - - - - - - - - -
------AAGCTCTCCAAGCGT---------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G Y E P E A L V N Y L A F L G W N P G T E Q E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F T L E E L I E A F S L D R V R P A A V Q F S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D K L Q W Y N Q Q F I R R M S V E E L A R K A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P Y L K K H G I E A D E A Y V R K V A A L M Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I T F V E E L A T F C R F F Y E D P T T Y E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K G V Q K R W K A N S A E L V R A Y A D R L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L K E F T A E T A E Q A L R E L A E E R G V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A E I I H P T R L A I S G L S F G P S L F E M M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500
E V I G K E A C V R R L R R A A E V L G
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_glu_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A G I E G P V R V R F A P S P T G S L H I G G
- - - - - - - - R V R F A P S P T G S L H I G G
------------------------CGGGTGCGTTTTGCCCCTAGCCCAACCGGCAGCTTGCACATCGGCGGT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V R T A L F N W L C A R H Y G G Q F I L R I E D
V R T A L F N W L C A R H - - - Q F I L R I E D
GTGCGTACCGCTCTCTTCAATTGGCTCTGTGCCCGTCAT---------CAGTTTATTCTGCGGATCGAAGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D E K R F V P G A A D D I S I S L R W V G I D
T D - - - - - P G A A D D I S I S L R W V . . D
ACTGAC---------------CCCGGTGCTGCCGATGATATTAGCATTTCGCTGCGCTGGGTT------GAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W D E G P D V G G P Y G P Y V Q S Q R F E Q G I
- - - - - - - - - - - G P Y V Q S Q - - - - - -
---------------------------------GGCCCCTACGTGCAGTCACAG------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y R P Y V D Q L L E A G L A Y M S F T T E E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T Q M R A A A E A A G I K A F R F R G S E R D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P L E R Q R E L A A S G K P Y T V R L K T P L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E T R F S D L I R G G D E I V V Q N D Q L Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I V L I K S S G M P V Y H F A H L V D D H L M K
- - - - - - - - - - V Y H F A H L V D D H - - -
------------------------------GTCTACCACTTTGCCCACCTCGTTGACGACCAT---------
217218219220221222223224225226227228229230231232233234235236237238239240
I T L V M R G E E W V P S T P Y H V L L Y D Y F
- - L V M R G E E W V P S T P Y H V L L Y D Y F
------CTTGTTATGCGTGGAGAAGAGTGGGTACCGAGCACACCGTACCACGTCTTACTCTACGACTACTTC
241242243244245246247248249250251252253254255256257258259260261262263264
G W Q R P I F A H L P A I L R H D G K G K L S K
- - - - P I F A H L - - - - - - - - - - K L S K
------------CCGATCTTTGCCCATCTG------------------------------AAACTGTCGAAG
265266267268269270271272273274275276277278279280281282283284285286287288
R K D D V A T Q R F R E R G Y L P E T M L N Y L
R - - - - - - - - - - - - - - - - - - - - - - -
CGC---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A L Q G W S Y D G V T E I M N R E E L I A R F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I E R I Q P S P A R W N P E K L R D M N G I Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R K L S R E Q L A E R V L P F M Q R A G L I G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P A S D T E R A Y L L Q L I P L I H E R L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q E A P E L L E F F Y C E V T P G V T Y Q P T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L I P K K H D A V Q T V T M L R A A H D V L Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q T D W T A P A L E T A L R T L V E Q L G V K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G P L F S A I R I A V T G R S V A P P L F D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503
A G V G R E R S L E R L A A A I A A L E Q M S
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_glu_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A A S K P V V T R F A P S P T G E L H V G G
- - - - - - - - V T R F A P S P T G E L H V G G
------------------------GTCACCCGCTTCGCCCCCTCGCCCACGGGGGAGCTGCACGTGGGCGGG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A R T A L Y S W A L A R R H G G R F L L R F E D
A R T A L Y S W A L A R R - - - R F L L R F E D
GCCCGCACGGCGCTGTACAGCTGGGCGCTGGCCCGCCGC---------CGGTTCCTGCTGCGCTTCGAGGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D L A R S S A A A A D R I R A D L A W F G L D
T D - - - - - A A A A D R I R A D L A W F . . D
ACCGAC---------------GCCGCCGCCGCCGACCGCATCCGCGCCGACCTCGCCTGGTTC------GAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W D N E G G V V P R Q S E R H A A G V Y D A A V
- - - E G . . . P R Q S E - - - - - - - - - - -
---------GAAGGC---------CCCCGCCAGAGCGAG---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D T L L S A G R A Y E R D G A V L F R F G C D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A F E D A V Y G C V E T P A S D N R D F V I R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G V A G G G M P T F H L A V V V D D H D A G V T
- - - - - - - - T F H L A V V V D D H - - - - -
------------------------ACCTTCCACCTCGCCGTCGTCGTCGACGACCAC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
H V V R G Q E H L S N T P K H A A L C D A L G F
H V V R G Q E H L S N T P K H A A L C D A L - -
CACGTCGTCCGCGGCCAGGAGCACCTCAGCAACACGCCCAAGCACGCGGCGTTGTGCGACGCCCTG------
193194195196197198199200201202203204205206207208209210211212213214215216
D R P V W A H T P S I L N P G G S K M S K R D K
- - P V W A H T - - - - - - - - - K M S K R - -
------CCGGTGTGGGCGCACACG---------------------------AAGATGAGCAAGCGC------
217218219220221222223224225226227228229230231232233234235236237238239240
A K A A R L G A A E N P R Q E L V V P G V T P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A L A A F L A K D N D D T A I A T A I A A A L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L A L P A V E V A D F R R A G Y L P G V V A N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V A L L G W N P G D G R E R L S M E E I A R A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D L G R V N R A N S T F D R A K L A A F S Q D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L I A M E P A A F A A A L R D H L A A Y R A G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L A A L G L E K I D A F A A L Y Q Q R A V T L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D P A S A G R F F V E P P A A Y D A K A V K K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L T R Q D G A G L A H L A A A R D A L A G V E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F D E A R V Q A A L E A L A A E R E L P H L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I A Q P L R V A L T G T A V S P D I A A T V A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502
L G R E E V L A R I D R C V E R F S G G G G
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_glu_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T R P V R T R F A P S P T G F I H L G N I R S
- - - - - R T R F A P S P T G F I H L G N I R S
---------------CGCACCCGTTTTGCGCCGAGCCCCACCGGCTTCATCCATCTCGGCAACATCCGATCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L Y P W A F A R K M K G T F V L R I E D T D V
A L Y P W A F A R K - - - T F V L R I E D T D -
GCGCTTTATCCGTGGGCGTTCGCCCGCAAG---------ACGTTCGTGCTGCGGATCGAGGACACCGAT---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E R S S Q E A V D A I L E G M A W L G L D Y D E
- - - - Q E A V D A I L E G M A W L . . D - - -
------------CAGGAGGCGGTCGACGCGATCCTCGAAGGGATGGCGTGGCTC------GAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G P Y Y Q M Q R M D R Y R E V L A Q M Q E K G L
G P Y Y Q M Q - - - - - - - - - - - - - - - - -
GGCCCGTACTATCAGATGCAG---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Y P C Y M S T E E L D A L R E R Q R A A G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P R Y D G T W R P E P G K V L P E P P A G V A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V L R F R N P L T G T V A W D D A V K G R V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S N E E L D D L V V A R P D G T P M Y N F C V V
- - - - - - - - - - - - - - - - - M Y N F C V V
---------------------------------------------------ATGTACAACTTCTGCGTCGTC
193194195196197198199200201202203204205206207208209210211212213214215216
V D D L D M G I T H V I R G D D H V N N T P R Q
V D D L - - - - - H V I R G D D H V N N T P R Q
GTCGACGATCTC---------------CACGTGATCCGCGGCGACGACCACGTGAACAACACGCCGCGCCAG
217218219220221222223224225226227228229230231232233234235236237238239240
I N I L R A L G G E V P V Y A H L P T V L N E Q
I N I L R A L - - - - P V Y A H L - - - - - - -
ATCAACATCCTGCGCGCGCTC------------CCGGTGTACGCGCACTTG---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G E K M S K R H G A M S V M G Y R D A G Y L P E
- - K M S K R - - - - - - - - - - - - - - - - -
------AAGATGAGCAAGCGT---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V L N Y L A R L G W S H G D A E I F T R E Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V E W F D L E H L G K S P A Q Y D H N K L N W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N N H Y I K E A D D A R L A G L A K P F F A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G I D A G A I E Q G P D L V S V M G L M K D R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S T V K E I A E N S A M F Y R A P A P G A D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A Q H V T D A V R P A L V E F A A A L K T V E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T K E A I A A A L K A V L G A H K L K M P Q L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
M P V R L L V A G T T H T P S I D A V L L L F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469
R D V V V S R I E A A L A
- - - - - - - - - - - - -
---------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_glu_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E R K V R V R F A P S P T G A L H I G G V R
- - - - - - R V R F A P S P T G A L H I G G V R
------------------GGCACGTTTCATGCGAGCCAATGTTTCTTCTTTTCCCAACACCCAGGAAATATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T A L Y N Y L F A R Q H G G D L I F R I E D T D
T A L Y N Y L F A R Q - - - D L I F R I E D T D
GAACATATGAGGACCTTTGCCCTCACCTACCAG---------GAAAGCATTCATAATATTACCTGTATGATA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S N R F V P G A E E Y I L E S F K W L G I Q F D
- - - - - P G A E E Y I L E S F K W L . . . . D
---------------CCAGTCCATTACTATTTTTTCTTGACCTTCAATGCTGAAATC------------CAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E G V S F G G E Y G P Y R Q S E R R E I Y K K Y
- G V . . . . . . . . Y R Q S E - - - - - - - -
---CTCCGC------------------------ATCCTCTTTCCAGCG------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Q V L L D N G K A Y I A F D T P E E L D A K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A E I A N F Q Y D A S T R V G M R N S L T L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E V E A L I A D G K Q Y V V R F K I E P N E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I H V N D L I R G E V V I N S S I L D D K V L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K S A D E L P T Y H L A N I V D D H L M E V S H
- - - - - - - T Y H L A N I V D D H - - - - - H
---------------------CAGCAGAGCAAGGAAATTGATAACAGCCTCGGG---------------ACG
217218219220221222223224225226227228229230231232233234235236237238239240
V I R G E E W L P S A P L H V L L Y R A F G W E
V I R G E E W L P S A P L H V L L Y R A F - - -
ATAACCGGAAGAAATCTCACCGCTCTTCGGGTCATGCCACTCAAGAGGGAATACAGGGAATCC---------
241242243244245246247248249250251252253254255256257258259260261262263264
D T M P A F A H L P L L L K P E G N G K L S K R
- - - P A F A H L - - - - - - - - - - K L S K R
---------TTTACTCAGTTTTCCATT------------------------------GGCAAAAGCCGGCAT
265266267268269270271272273274275276277278279280281282283284285286287288
D G D R L G F P V F P L E W H D P K S G E I S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G Y R E S G Y L P E A V I N F L A L L G W N P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N D Q E V M S M D E L I R L F D L H R C S K S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A K F D Y K K G I W F N H T Y I Q Q K S D K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A E L F V P V L K E H G V E A P F E K V V T V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G M M K D R V S F V K E L W E V C S F F F V A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T E Y D E K T V K K R W K E D S A K C M T E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E V L A G I E D F S I E G Q E K I V M D W I A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K G Y H T G N I M N A F R L T L V G E G K G P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M F D I S W V L G K E E T L A R M K R A V E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505
K
-
---
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_glu_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K D V R V R Y A P S P T G H L H I G G A R T
- - - - - R V R Y A P S P T G H L H I G G A R T
---------------CGCGTGCGCTATGCGCCGAGCCCGACCGGCCATTTGCATATCGGAGGGGCGCGGACC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L F N Y L F A R H H G G K M I V R I E D T D I
A L F N Y L F A R H - - - K M I V R I E D T D -
GCGCTGTTTAACTATTTGTTTGCTCGCCAT---------AAAATGATCGTCCGCATCGAGGATACGGAT---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E R N V E G G E Q S Q L E N L Q W L G I D Y D E
- - - - E G G E Q S Q L E N L Q W L . . D - - -
------------GAAGGCGGCGAACAGTCGCAGCTCGAAAACTTACAATGGCTC------GAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V D K D G G Y G P Y R Q T E R L D I Y R K Y V
S V . . . . . . . . Y R Q T E - - - - - - - - -
TCCGTT------------------------TACCGCCAGACGGAG---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D E L L E Q G H A Y K C F C T P E E L E R E R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E Q R A A G I A A P Q Y S G K C R R L T P E Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A E L E A Q G K P Y T I R L K V P E G K T Y E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D D L V R G K V T F E S K D I G D W V I V K A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G I P T Y N F A V V I D D H L M E I S H V F R G
- - - T Y N F A V V I D D H - - - - - H V F R G
---------ACGTACAACTTTGCCGTCGTCATCGACGACCAC---------------CATGTGTTCCGCGGT
217218219220221222223224225226227228229230231232233234235236237238239240
E E H L S N T P K Q L M V Y E Y F G W E P P Q F
E E H L S N T P K Q L M V Y E Y F - - - - P Q F
GAGGAGCATTTGTCCAACACGCCGAAGCAGCTGATGGTGTATGAATATTTT------------CCGCAGTTT
241242243244245246247248249250251252253254255256257258259260261262263264
A H L T L I V N E Q R K K L S K R D E S I I Q F
A H L - - - - - - - - - K L S K R - - - - - - -
GCCCATTTG---------------------------AAGTTGTCCAAGCGC---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V S Q Y K E L G Y L P E A M F N F F A L L G W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P E G E E E I F S K D E L I R I F D V S R L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S P S M F D T K K L T W M N N Q Y I K K L D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R L V E L A L P H L V K A G R L P A D M S D E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R Q W A R D L I A L Y Q E Q M S Y G A E I V P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S E L F F K E E V E Y E D E A R Q V L A E E Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P D V L S A F L A H V R D L D P F T A D E I K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A I K A V Q K A T G Q K G K K L F M P I R A A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T G Q T H G P E L P F A I Q L L G K Q K V I E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489
L E R A L Q E K F
- - - - - - - - -
---------------------------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_glu_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D R P T P A R T R F A P S P T G Y L H I G S
- - - - - - - - R T R F A P S P T G Y L H I G S
------------------------AGCAGCAGCAGTGCTGATTCGGGCGAGCGTCACAGCTTTACCTAAAAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L R T V L F S W L W A R H T G G Q F L L R I E D
L R T V L F S W L W A R H - - - Q F L L R I E D
CGCCAAGGTTTCGAATAGGCCTGGCGAGGTCGTGCGCCC---------AACGCGAATAGGCATAAACACTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D R K R F V E G A E E Q L T S S L Q A I G L M
T D - - - - - E G A E E Q L T S S L Q A I . . .
GGGAAT---------------ATTGACAAAATCATGCAAGAGCTTGTCTAAACTGGGGGCATC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W D E G P I V G G P H A P Y K Q S E R L E I Y Q
. D - - - - - - G P . . . Y K Q S E - - - - - -
---AGC------------------TTGGCC---------AACCGTTTGCGCCGG------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A H A Q A L I D K G V A Y R S Y A T A D E I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I N A E R E A R G E P K L L V F R N L P G I D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A A R E A A G A D Y N V R L S L K T T G Q T V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q D L V R G Q I V F D N A A L K M P D P V L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T D G F P T Y A L A A M V D D H L M G I T H V L
- - - - - T Y A L A A M V D D H - - - - - H V L
---------------TTCAAGGGTCATAAACTCTGTTTTATCATCGTA---------------GGCCAAATA
217218219220221222223224225226227228229230231232233234235236237238239240
R A D E W I P T W P I H H Q I Y E A F G W E Q P
R A D E W I P T W P I H H Q I Y E A F - - - - P
GTTGATAATGGCTTCGGGCACAAAGCCTAAATCGATATACTCGGTGACCGATGTATC------------GGA
241242243244245246247248249250251252253254255256257258259260261262263264
V W V H V P Q V L G S D G K K L S K R H G D T S
V W V H V - - - - - - - - - K L S K R - - - - -
AAGCTTCTTGCCATC---------------------------CCAAACTGGTTGCTC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
V T E Y I D L G F V P E A I I N Y L A L I G W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y D D K T E F M T L E E L I E R F D L N R I R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S G G V F D R D K L L H F N G V Y L R N M A P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E L A Q R V A P Y L S K A G L I S A E P T A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L A K I T E Y L P L V Q D R L K L L S E A P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L D F F F V D P Q G Y D P A L L V P K K G D P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q T V E I L G Q V K A S F E A V E T W D A P S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D K L L H D F V N Q L G L K I P Q V F M P I R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A I S G R T T S P G L F E T L A V L G K A V T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495
A R I S T A A A A L S S A S V
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_glu_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K V K T R F A P S P T G Y L H L G N A R T A
- - - - K T R F A P S P T G Y L H L G N A R T A
------------AAAACGAGGTTCGCACCCAGTCCAACCGGATACCTACACCTCGGAAACGCAAGAACAGCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I F S Y L F A R H N N G G F V L R I E D T D P E
I F S Y L F A R H - - - G F V L R I E D T D - -
ATATTCAGTTATCTGTTTGCAAGGCAC---------GGTTTTGTACTTCGTATAGAGGACACCGAT------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R S K K E Y E E M L I E D L K W L G I D W D E F
- - - K E Y E E M L I E D L K W L . . D - - - F
---------AAAGAGTATGAAGAAATGCTGATAGAGGATTTAAAGTGGCTC------GAT---------TTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y R Q S E R F D I Y R E Y V N K L L E S G H A Y
Y R Q S E - - - - - - - - - - - - - - - - - - -
TACAGACAGTCCGAG---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P C F C T P E E L E K E R E E A R K K G I P Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y S G K C R H L T P E E V E K F K K E G K P F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I R F K V P E N R T V V F E D L I K G H I A I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T D D F G D F V I V R S D G S P T Y N F V V V V
- - - - - - - - - - - - - - - - T Y N F V V V V
------------------------------------------------ACTTACAACTTCGTCGTTGTTGTT
193194195196197198199200201202203204205206207208209210211212213214215216
D D A L M G I T H V I R G E D H I P N T P K Q I
D D A - - - - - H V I R G E D H I P N T P K Q I
GACGACGCC---------------CACGTGATAAGAGGAGAGGACCACATACCCAACACTCCCAAGCAAATA
217218219220221222223224225226227228229230231232233234235236237238239240
L I Y E A L G F P V P K F A H L P V I L G E D R
L I Y E A L - - - - P K F A H L - - - - - - - -
CTCATATACGAAGCTCTC------------CCCAAGTTCGCACACCTT------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S K L S K R H G A V S V R A Y R E E G Y M P E A
- K L S K R - - - - - - - - - - - - - - - - - -
---AAACTCTCAAAGAGG------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L F N Y L C L L G W S P P E E G R E I F S K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L I K I F D L K D V N D S P A V F N K E K L K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M N G V Y I R E V L P L D V L L E R A I P F L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K A G Y D T S D R E Y I K K V L E Y T R D S F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L S E M V D R L R P F F V D E F E I P E E L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S F L D D E K A Y Q V L S A F L E K I R E K K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E T P Q E V K K L A K E I Q K A L K V K P P Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W K P L R I A L T G E L E G V G I D I L I A V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473
P K E K I E K R I L R V L E K L S
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_glu_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T V R T R F A P S P T G Y L H I G G V R T A L
- - - R T R F A P S P T G Y L H I G G V R T A L
---------CTTGATGGCGTTCTCAATCCGGGCGAGCACCTTGTCGCGGCCGAGGAGCACGAGTGTTTCCGG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F N W L Y A R R H E G Q F V L R I D D T D A A R
F N W L Y A R R - - - Q F V L R I D D T D - - -
CAAGCCGAAGCCGGTCGTCTCACC---------GACGCGAAGCGGGCCGTCGAGATCCCGGGG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N R A E A V K P I L D G F D W L G M D W D E G P
- - A E A V K P I L D G F D W L . . D - - - - -
------GGTCGCGTAGCCCATGAACGCTGCCAGGATCGTCGGCGCGTC------CTC---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T K D A S G D S F G P H K P Y F Q G Q R N D K Y
- - - - - - - - - G P . . . Y F Q G Q - - - - -
---------------------------GACGCC---------GAGCTTGTCCGCGAC---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V A A A M K L M A E G K A Y P D Y T T Q A E Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S R R D L A A R L K K A Y V H R G S N R D V A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E N L R L Y K E K P A P V L L K V P V G E T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V F E D H V R G R V E V S T D T I R D P A L L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A P N E A G V C G A L Y A F A T V V D E V D F G
- - - - - - - - - - L Y A F A T V V D E V - - -
------------------------------CGCCCAACCGAGGCGCACGAGGTAGTTCATTAG---------
217218219220221222223224225226227228229230231232233234235236237238239240
I T H V I R A E E H L A N T P V Q I L I Y N A L
- - H V I R A E E H L A N T P V Q I L I Y N A L
------ACCCAACTCGCGGTAGTACGCGACCGTTGCCAGGTTGAGATCGTCGCGCCCCTTCAGTTCCTCATC
241242243244245246247248249250251252253254255256257258259260261262263264
G G A V P E F A H V P L I Y R N G K K I S K R D
- - - - P E F A H V - - - - - - - - K I S K R -
------------CGCTTTCAGCTTGGCGAT------------------------GTCGCGCTTGCTGAT---
265266267268269270271272273274275276277278279280281282283284285286287288
L P P L S A D E I A K L K A C G W T D E E L K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R D D L N L A T V A Y Y R E L G Y I P A A L M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y L V R L G W A L N A T D E I F P L E T A I A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F D T K D V T K A P G N F D E K K L F W V Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y M R K L S A E E K L V G A M P Y L L R S K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S N P I S D T T R A V L L K V A E A A A D R I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L F S E F V F Y A A P I L K D V P D Y N P K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A D K L A K P G V A D R L R G F A D E L R A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P F D A P T I L A A F M G Y A T K V G V K P R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L D G P L R V A V T G E T T G F G L P E T L V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521
L G R D K V L A R I E N A I K M T
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_glu_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K T R I R T R Y A P S P T G Y L H I G G A R
- - - - - - R T R Y A P S P T G Y L H I G G A R
------------------TCTTTTTTGAATTATTTCTTTTCCGTATAAATAAATAGCTTTTGCAAGTTCAGG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T A L F N Y L F A K H F N G D F I V R I E D T D
T A L F N Y L F A K H - - - D F I V R I E D T D
TCCATGCTCATTAAAAGTTGTTGCTAATCTAAT---------TAATTTTTTACCATTTACATTCAAATCAGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I A R N V A G G E E S Q L D N L E W L Q I Y P D
- - - - - A G G E E S Q L D N L E W L . . . . D
---------------TGCCTTTTGAATTGAATCTACGCTGAAATTTTCAAAGTTTAA------------TTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E S P K N P N E K Y G K Y R Q S E K L D R Y N E
- S P . . . . . . . . . Y R Q S E - - - - - - -
---TACAAC---------------------------AATCATTGGATTTTC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I V E I L L K K G L A Y K A Y D T T Y E L E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R A E Q I A K G I F S F R Y D R N W L K I S D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E I K K R E V E Q T Y S I R I A L P K N H D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
W N D L V R G L I K V N S E D I G D W V I I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D K Y P T Y N F A V V V D D F D M Q I S H V L R
- - - - T Y N F A V V V D D F - - - - - H V L R
------------ATAATTAGAAATAAATTGTTTTACTGAATCATC---------------TACGCCTTTTGA
217218219220221222223224225226227228229230231232233234235236237238239240
G E E H I T N T P K Q L A V Y E A M G W D K P V
G E E H I T N T P K Q L A V Y E A M - - - - P V
ATTTGTAATTAAAGTTAGATGTCCAAAAACAGGTTTATCTCATCCCATAGCTTC------------TTGTTT
241242243244245246247248249250251252253254255256257258259260261262263264
F G H L T L I T N S K G V K L S K R D D S V K Q
F G H L - - - - - - - - - K L S K R - - - - - -
TGGGGTATTTGT---------------------------AGAAATTTGCATATC------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F I S N Y K E D G Y V S W A I S N Y L A L L G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T S K D T K E I M T K E E L I E K F D P E R L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A S P S K F D M K K M N W Y G K H Y L Q E I N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N E I F E Y L E S L K D K K W L D L F I E T F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P N A F S L S E L K R E L K E Y E N P M I E K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I E I N D V V K K F K Q N L N F E N F S V D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I Q K A I D K T G T D L N V N G K K L F L P I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L A T T F N E H G P E L A K A I Y L Y G K E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464
Q K R L G N V N
- - - - - - - -
------------------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_glu_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G N E V R V R Y A P S P T G H L H I G N A R T
- - - - - R V R Y A P S P T G H L H I G N A R T
---------------CGGGTTCGTTATGCGCCGAGCCCAACAGGCCATTTACATATCGGAAATGCCAGAACC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L F N Y L F A R S Q G G K F I I R I E D T D R
A L F N Y L F A R S - - - K F I I R I E D T D -
GCTCTTTTTAATTATTTGTTTGCCCGGAGC---------AAATTCATCATCCGCATTGAAGATACGGAC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K R N I E G G E Q S Q L N Y L K W L G I D W D E
- - - - E G G E Q S Q L N Y L K W L . . D - - -
------------GAAGGCGGGGAGCAAAGCCAGCTGAACTATTTAAAATGGCTG------GAC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V D V G G E Y G P Y R Q S E R N D I Y K T Y Y
S V . . . . . . . . Y R Q S E - - - - - - - - -
AGCGTG------------------------TACCGCCAATCCGAA---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E L L E K G L A Y K C Y C T E E E L E K E R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E Q A A R G E M P R Y S G K C R N L T K E E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K L E A E G R Q P S I R F K V P Q G E V I S F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D I V K G E I S F E T D G I G D F V I V K K D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T P T Y N F A V A V D D Y L M K M T H V L R G E
- - T Y N F A V A V D D Y - - - - - H V L R G E
------ACTTACAACTTTGCCGTAGCGGTCGATGACTAT---------------CATGTCCTGCGCGGCGAA
217218219220221222223224225226227228229230231232233234235236237238239240
D H I S N T P K Q I M I Y N A L G W D I P A F G
D H I S N T P K Q I M I Y N A L - - - - P A F G
GACCACATTTCCAATACGCCAAAGCAGATCATGATTTACAACGCCCTT------------CCGGCATTTGGA
241242243244245246247248249250251252253254255256257258259260261262263264
H M T L I V N E N R K K L S K R D E S I I Q F I
H M - - - - - - - - - K L S K R - - - - - - - -
CATATG---------------------------AAACTGAGCAAACGT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E Q Y E E L G Y L P E A L F N F I T L L G W S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V G E E E L F T K E Q F I E I F D V H R L S K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P A V F D T H K L K W V N N Q Y V K K L D L D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I E L T V P H L Q K A G K V S E E L T G S E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E W V R K L I S L Y Q E Q L S Y G A E I V E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L F F K D D I Q Y N R E A R T V L E E E Q V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E V L R V F A E T L E Q L D S F T A D E I K A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I K A V Q K E T G H K G K K L F M P I R V A T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G Q T H G P E L P Q S I E L L G K D T V L K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485
N N I I Q
- - - - -
---------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_glu_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T R V R Y A P S P T G L Q H I G G I R T A L
- - - R V R Y A P S P T G L Q H I G G I R T A L
---------TATTCTTAAAAATTCCTGTGCTAATTTTATTCTTTCAAAAACTTTAGACTTGCCTATCAATTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F N Y F F A K S C G G K F L L R I E D T D Q S R
F N Y F F A K S - - - K F L L R I E D T D - - -
TAAAGAATCAAAAAGCGGCGGAGA---------ACCAAGCGCTGCAATTCTAATAGGAAGAAG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y S P E A E N D L Y S S L K W L G I S F D E G P
- - P E A E N D L Y S S L K W L . . . . D - - -
------AAAACCATTACTCTCAGCAAAATCATAAAAAATTTTATCATT------------TCT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V G G D Y A P Y V Q S Q R S A I Y K Q Y A K Y
- - - G . . . P Y V Q S Q - - - - - - - - - - -
---------AAT---------TAATTCTAAAATAGAACA---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L I E S G H A Y Y C Y C S P E R L E R I K K I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N I N K M P P G Y D R H C R N L S N E E V E N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L I K K I K P V V R F K I P L E G D T S F D D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L G R I T W A N K D I S P D P V I L K S D G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P T Y H L A N V V D D Y L M K I T H V L R A Q E
- T Y H L A N V V D D Y - - - - - H V L R A Q E
---CTCAAGATCATTTTTTGAAAAAAATTCTCTCTT---------------GCCAAGCAAAGTAACATAATT
217218219220221222223224225226227228229230231232233234235236237238239240
W V S S G P L H V L L Y K A F K W K P P I Y C H
W V S S G P L H V L L Y K A F - - - - P I Y C H
AATAATAGCCTCTGGAAGATACCCATCTTCAATAAACTGTCTTAA------------ATGTCTTTTGCTTAA
241242243244245246247248249250251252253254255256257258259260261262263264
L P M V M G N D G Q K L S K R H G S T A L R Q F
L - - - - - - - - - K L S K R - - - - - - - - -
TTT---------------------------AAGGTGACAATAAAT---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I E D G Y L P E A I I N Y V T L L G W S Y D D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R E F F S K N D L E Q F F S I E K I N K S P A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F D Y H K L D F F N S Y Y I R E K K D E D L F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L L L P F F Q K K G Y V S K P S T L E E N Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K L L I P L I K S R I K K L S D A L N M T K F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y E D I K S W N L D E F L S R K K T A K E V C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I L E L I K P I L E G F E K R S S E E N D K I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y D F A E S N G F K L G E I L L P I R I A A L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S K V S P P L F D S L K L I G K S K V F E R I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490
L A Q E F L R I N E
- - - - - - - - - -
------------------------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_glu_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D R I R V R Y A P S P T G Y L H I G N A R T
- - - - - R V R Y A P S P T G Y L H I G N A R T
---------------AGAGTAAGATATGCACCAAGTCCAACTGGTTATCTTCATATTGGTAATGCAAGAACA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L F N Y L Y A K H Y N G D F V I R I E D T D K
A L F N Y L Y A K H - - - D F V I R I E D T D -
GCATTATTCAATTACTTGTATGCTAAACAT---------GATTTTGTGATTCGAATTGAAGATACTGAT---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K R N L E D G E T S Q F D N L K W L G L D W D E
- - - - E D G E T S Q F D N L K W L . . D - - -
------------GAAGATGGAGAAACATCACAATTTGATAATCTTAAATGGTTA------GAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V D K D N G Y G P Y R Q S E R Q H I Y Q P L I
S V . . . . . . . . Y R Q S E - - - - - - - - -
TCTGTA------------------------TATCGTCAATCTGAA---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D Q L L A E D K A Y K C Y M T E E E L E A E R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A Q I A R G E M P R Y G G Q H A H L T E E Q R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q F E A E G R Q P S I R F R V P Q N Q T Y S F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D M V K G N I S F D S N G I G D W V I V K K D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I P T Y N F A V A I D D H Y M E I S D V I R G D
- - T Y N F A V A I D D H - - - - - D V I R G D
------ACGTACAATTTTGCAGTAGCTATAGATGATCAT---------------GATGTCATTCGTGGTGAT
217218219220221222223224225226227228229230231232233234235236237238239240
D H I S N T P K Q I M I Y E A F G W E P P R F G
D H I S N T P K Q I M I Y E A F - - - - P R F G
GATCATATTTCAAACACGCCTAAACAAATTATGATTTATGAAGCATTT------------CCTCGTTTTGGT
241242243244245246247248249250251252253254255256257258259260261262263264
H M S L I V N E E R K K L S K R D G Q I L Q F I
H M - - - - - - - - - K L S K R - - - - - - - -
CATATG---------------------------AAGTTAAGTAAACGT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E Q Y R D L G Y L P E A L F N F I A L L G W S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E G E E E I F S K E E F I K I F D E K R L S K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P A F F D K Q K L A W V N N Q Y M K Q K D T E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V F Q L A L P H L I K A N L I P E V P S E E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S W G R K L I A L Y Q K E M S Y A G E I V P L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E M F F K E M P A L G E E E Q Q V I N G E Q V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E L M T H L F S K L E A L E P F E A A E I K K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I K E V Q K E T G I K G K Q L F M P I R V A V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G Q M H G P E L P N T I E V L G K E K V L N R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484
K Q Y K
- - - -
------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_glu_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T N N K T K S D N K S K T G Q Y E G K L P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I Q G Q V V T R F P P E P S G Y L H I G H A K
- - - - - - V T R F P P E P S G Y L H I G H A K
------------------TATAATAGGTTCTTCTGGCTTATCAGAACAGAATGGTTTATCTACAATAAAGTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A A L L N Y Y Y A N K Y E G K L L L R F D D T N
A A L L N Y Y Y A N K - - - K L L L R F D D T N
ACCTCTTCTTTCAAGTTGAAGTCTATCTCCAGA---------TTTAATTAGTGGATCACAAAATGCAGGTGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P V L E N E E F Q E S I E A D L K I L G I T P F
- - - - - E E F Q E S I E A D L K I L . . . . F
---------------AGTATTGACAAGGTCCTGAATTTCATCACCATCTTCTGGCTT------------TAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N V S F T S D H F D T I M N Y C E E M F K L G K
N V S F T S D - - - - - - - - - - - - - - - - -
ATGGTCGTATTCTCTTAGAAT---------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A Y V D D T C V E V M R E E R G K G I E S K N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N N S V D E N L R L W K E M I D G T E H G L K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
C V R A K I D M Q C K N K C M R D P V L Y R C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L T P H H R T G T K Y K V Y P T Y D F A C P I V
- - - - - - - - - - - - - - - T Y D F A C P I V
---------------------------------------------TAAAGCTACGGCATCTTGCCCAACAGC
217218219220221222223224225226227228229230231232233234235236237238239240
D S I E G V T H A L R T N E Y S D R I E Q Y N W
D S - - - - - H A L R T N E Y S D R I E Q Y N W
AAAGAA---------------ATCCATAAGTTGTTTGTTAATAGTCCAGAGTTTATCCCATTCCATAAGATT
241242243244245246247248249250251252253254255256257258259260261262263264
V I N A L G L R P V E I Y E F S R L N F V N T V
V I N A L - - - - V E I Y E F - - - - - - - - V
GGAATTTTTAGATGG------------GACGAATTGTAATAAAGC------------------------AAT
265266267268269270271272273274275276277278279280281282283284285286287288
L S K R K L T W I V N N G L V E G W D D P R F P
L S K R - - - - - - - - - - - - - - - - - - - -
TCCTCTAACAGT------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T V R G I V R R G L S P S A L L Q F V T E Q G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S K N S N L M E W D K L W T I N K Q L M D P V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P R F F A V G Q D A V A L N L S E A P E E P L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N Q R D L H Q K N P D L G K G Q I V M Y K S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D R D D A T Q I L S G E E I T L M K W G N A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I Q D I S Q I D K Q P T G I F E G K L N L E G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F R S T K K K I H W L A N L P S V L T K C I L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E Y D H L I N K R K P E D G D E I Q D L V N T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S L F E T P A F C D P L I K D L K S G D R L Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E R R G Y F I V D K P F C S D K P E E P I I L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K I P D G K S K A S S T I S S K V D A Q K L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555
G K N
- - -
---------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_glu_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R R F L P M H M L V N I H L K A L T L S N T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F T T A P Q R E E N E K L Q L S N A E K G K V V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T R F P P E A S G F L H I G H A K A A L I N R M
T R F P P E A S G F L H I G H A K A A L I N R M
ACCCGCTTCCCCCCAGAGGCTAGCGGGTTCCTGCATATCGGCCATGCGAAAGCTGCGCTGATCAACCGCATG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L A D A Y E G K M L F R F D D T N P S K E K E H
L A D A - - - K M L F R F D D T N - - - - - E H
CTGGCGGACGCG---------AAGATGCTTTTCCGCTTCGATGACACAAAT---------------GAGCAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F E V A I E E D L K T L G V R Y D F G P T Y S S
F E V A I E E D L K T L . . . . D - G P T Y S S
TTTGAGGTTGCCATCGAGGAGGATCTCAAGACACTA------------GAT---GGGCCAACATACTCGTCG
121122123124125126127128129130131132133134135136137138139140141142143144
D Y F D L M F E K A E D M I K R G L A Y C D K T
D - - - - - - - - - - - - - - - - - - - - - - -
GAC---------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P R E E M Q K C R F N G I P T K Y R D A S V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N M R L W R E M K K G T E E G Q I T C L R A K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S I D D P N K A M R D P V M Y R V S M T P H A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H G T K Q V A Y P T Y D F C C P L V D S V E G V
- - - - - - - - - T Y D F C C P L V D S - - - -
---------------------------ACCTATGACTTCTGCTGTCCTCTTGTCGACTCG------------
241242243244245246247248249250251252253254255256257258259260261262263264
T H A L R T N E Y H D R N A Q Y Y W F C D A M G
- H A L R T N E Y H D R N A Q Y Y W F C D A M -
---CATGCTCTTCGCACAAATGAGTATCACGACCGCAATGCCCAGTACTACTGGTTTTGCGACGCTATG---
265266267268269270271272273274275276277278279280281282283284285286287288
I R K P T I E D F S R L N M E Y S V M S K R M L
- - - P T I E D F - - - - - - - - V M S K R - -
---------CCGACCATTGAGGACTTC------------------------GTAATGTCAAAGCGA------
289290291292293294295296297298299300301302303304305306307308309310311312
T K L V D T H V V D G W D D P R L P T V R A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R G M Q I E A L R Q F V A E Q G M S K S V N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M E W S K I W Y F N A Q I L D P T S P R Y T V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S N T L K V R C T V E G Q R H M E A E K K P L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K K D S S M G E K T Y Y K S D I I F L D A E D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V L I K D G D E V T L M D W G N A Y V K D I K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P S A D A L P T E A T I V L H P E G D V K K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F K L T W V P E S D K A V I L T L N E Y D N L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T K K K P D P E E S I D D I I A P V S R Y S Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V I G E E A L S V V K K G D I V Q L E R R G Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I V D D D K A E K K V L I S I P D G R D K V N H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L S A K A Q Y L K T L P K K A S A A D E L A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594
R A A K A A K K A A Q K A A A K S S
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_glu_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E N K N K K L I F V N F L F S K K H G M A V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N A I N F R E I C S L L D I S E S Y K C T I N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F L D N V E K C T D K H Y N D A L N L L D T F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S N E V K S N S L V N D L I F C I I N S N F D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K V F K S N K L R L E N L Q I V Y E S A F N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N K P F L K E F S A K D K I N K E V K K N L Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T P A V T R F A P E P S G C L H I G H L K A L L
- - - V T R F A P E P S G C L H I G H L K A L L
---------CAATGATGTATTTTTCTTGTTTAAAGGAATATTTTTAGTGTATTTTAATCCTTCAAAGTTAGT
169170171172173174175176177178179180181182183184185186187188189190191192
V N Y N L A E K S N G T L L L R F D D T N P V K
V N Y N L A E K - - - T L L L R F D D T N - - -
GATAAACACTCTAATACAGTTTAT---------TGCCATGAATCTTGGACTAAGCGGATCAAT---------
193194195196197198199200201202203204205206207208209210211212213214215216
N Y E K Y E K E I L R D L D T L G I T G L K I S
- - E K Y E K E I L R D L D T L . . . . L K I S
------AGCCCATATTTTATCCCACGATATAACATTAGTTTTATTAGA------------ATTAATATAATC
217218219220221222223224225226227228229230231232233234235236237238239240
H S S D Y F E L L V D E A V S L I N K N L A Y V
H S S D - - - - - - - - - - - - - - - - - - - -
TTTAAGAGCTGT------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D N T D Q E T M R I E R F E G I E S K M R N I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N S E S L K I F K E L L Q G R A P G Y C L R A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I D M S N P N K S M R D P V I Y R A S D K M H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R C K L Y K A F P T Y D F V C P I V D S I E G V
- - - - - - - - - T Y D F V C P I V D S - - - -
---------------------------GCATCTTCCATGCATTTTATCACTAGCCCTATA------------
337338339340341342343344345346347348349350351352353354355356357358359360
T V V C R A N E Y K D R N E Q Y K W F L E N L K
- V V C R A N E Y K D R N E Q Y K W F L E N L -
---CATCGATTTATTGGGATTAGACATATCAATCTTAGCTCTAAGACAGTATCCTGGCGCACGGCCTTG---
361362363364365366367368369370371372373374375376377378379380381382383384
L E N K P E F N D F S K L N L E D T V L S K R K
- - - - P E F N D F - - - - - - - - V L S K R -
------------AATTTTAAGACTTTCGGA------------------------TTCTATTCCTTCAAA---
385386387388389390391392393394395396397398399400401402403404405406407408
I D K L I S D S L V T G W D D P R L A T I Q G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K R L G M H M T A L K D Y I N L Q G A S N K T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V I S W D K I W A M N K K V I D P L S P R F M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V E K I N C I R V F I T N F E G L K Y T K N I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L N K K N T S L G S K D V L F S D T L L F S Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D G F V L K E N E E F T L M N W G N A I V E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V V E N S I V T E L Y I K L H L E G D Y K S T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N K I S W V S E S G A V T A T G I E Y G N L L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N E E F N I N S K I D K Q Y Y V E S S I T N L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T D M K H V Q F E R I G F F Y C D S P C V F H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634
V P F T K Q K R T Y
- - - - - - - - - -
------------------------------
Class I
Eukaryotes/Trichomonas vaginalis/amino acid sequences/Tvaginalis_glu_aa
Eukaryotes/Trichomonas vaginalis/nucleotide sequences/Tvaginalis_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D I K L R F A P S P T G Y L H I G G L R T A
- - - - K L R F A P S P T G Y L H I G G L R T A
------------AAATTAAGATTTGCACCATCACCAACAGGTTACCTCCACATAGGAGGTTTGAGAACAGCT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L Y N Y L F A K K N G G K F V L R I E D T D R T
L Y N Y L F A K K - - - K F V L R I E D T D - -
CTTTACAATTACTTATTCGCAAAAAAA---------AAATTTGTATTGAGAATCGAAGATACAGAT------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R Y V E G A I E N L I E S L E W A G I T H D E G
- - - E G A I E N L I E S L E W A . . . . D - -
---------GAAGGTGCCATAGAAAACCTAATTGAGTCCCTTGAATGGGCA------------GAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V V K D G N L T E V G N C G P Y I Q S Q R L D
- - - - - G . . . . V . . . . . Y I Q S Q - - -
---------------GGT------------GTT---------------TACATCCAATCACAA---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I Y K K Y V D K L I E D G H A Y Y C F C S K D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D H L R E E Q R I K G K V P K Y D G L C R G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P L E E A K K R V A A G E D Y V V R L K L P K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K D I T F N D A V R G K V T I N T D E I D D Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L M K S D G F P T Y H M A V I V D D H L M G I T
- - - - - - - - T Y H M A V I V D D H - - - - -
------------------------ACTTACCACATGGCTGTAATAGTTGATGACCAC---------------
217218219220221222223224225226227228229230231232233234235236237238239240
H I V R G E E W L P S T P K H V Y L Y E C L G W
H I V R G E E W L P S T P K H V Y L Y E C L - -
CACATTGTAAGAGGGGAAGAATGGCTTCCATCAACTCCAAAACACGTTTATCTTTATGAATGTCTT------
241242243244245246247248249250251252253254255256257258259260261262263264
Q P P E F V H L P T V L N K D R K K L S K R Q G
- - P E F V H L - - - - - - - - - K L S K R - -
------CCAGAATTTGTCCACCTT---------------------------AAGCTTTCTAAGAGA------
265266267268269270271272273274275276277278279280281282283284285286287288
D V S V E D F K K R G Y L P E G L V N Y L A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G W S P E D G E E I M S L D E L V E K F S F D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V G K S G G I F D T D K L N W V N S H Y M K S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D L E K L S E L A I P F V T E S G L L N E E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R N N F E W Y K I L I E T V R E A C D K L E D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P R H I E F L F G D I E I T E D Q A K E E L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E H V P G L L D S F I K I V K S H D E I E M E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A K G L M K E V Q K D S G V K G K Q L Y M P V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A A I S G N V H G P E M Q N I L Y L L G K D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491
I E R A E K I K D L L
- - - - - - - - - - -
---------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_glu_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_glu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V R V R L A P S P T G T L H I G T A R T A L F
- - R V R L A P S P T G T L H I G T A R T A L F
------CGGGTACGATTAGCTCCTAGTCCAACTGGAACACTTCACATAGGAACTGCACGTACTGCATTATTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N W L F A R Q Q G G A F L L R I E D T D R E R S
N W L F A R Q - - - A F L L R I E D T D - - - -
AATTGGTTGTTTGCACGTCAA---------GCATTTCTTCTGCGTATTGAGGACACTGAT------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S E E F T D N I L E G L Q W I G L D W D E D P V
- E E F T D N I L E G L Q W I . . D - - - D P V
---GAAGAATTCACTGATAATATTTTAGAAGGACTTCAATGGATT------GAC---------GATCCAGTA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I Q S H R L E A H K A A I Q Q L L A N G K A Y R
I Q S H - - - - - - - - - - - - - - - - - - - -
ATTCAAAGTCAT------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C Y A S T T E L E N M R S L Q K A E N N A P R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D N R H R N L T R S Q E Q S L I S E G R E A V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R F R I D D N E I I E W N D L I R G P M L W R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S D L G G D M V I A R Q A P A N Q I G D P L Y N
- - - - - - - - - - - - - - - - - - - - - L Y N
---------------------------------------------------------------CTTTACAAT
193194195196197198199200201202203204205206207208209210211212213214215216
L A V V V D D A T M A I S H V I R G E D H I A N
L A V V V D D A - - - - - H V I R G E D H I A N
CTAGCAGTAGTTGTAGATGATGCA---------------CATGTAATACGTGGTGAAGATCATATTGCTAAC
217218219220221222223224225226227228229230231232233234235236237238239240
T A K Q L Q L Y K A L N L P V P Q F A H T P L I
T A K Q L Q L Y K A L - - - - P Q F A H T - - -
ACTGCCAAACAATTGCAACTTTATAAAGCTTTA------------CCACAATTTGCCCACACA---------
241242243244245246247248249250251252253254255256257258259260261262263264
L N K E N R K L S K R D G V T S I N D F R N M G
- - - - - - K L S K R - - - - - - - - - - - - -
------------------AAATTATCTAAACGT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y S S S S L A N Y M T L L G W S P P K G M S E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F S S K E A A T V F T L S R V N K A G A R F D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D K L N W L N S Q T L H E L D L R E L R E Q L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P L W I N R G W I E N S I P E T K G K I S E Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L T W Q I D L C E L L K P S L V L L S D G V D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A I P F F Q C P D I E E K A W S Q I K T A S N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A L R E L L N V L I N K G W D G Q E I S I A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E I L K F T C Q A T D T K K G I L M K S L R S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L L G S I Q G P D L L T S W S L L A R I G K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489
K R I R R C I L N
- - - - - - - - -
---------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_ile_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T W D E R K D A P I F A F L E G P P T A N G F
- - - - - - - - - - - - A F L E . P P T A N G F
------------------------------------GCGTTCCTCGAG---CCGCCCACCGCTAACGGCTTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M H V G H A R G R T L K D V K L R Y A R M R G Y
M H V G H A R G R T L K D V K L R Y - - - - - -
ATGCACGTTGGTCACGCCCGGGGCAGGACGCTGAAGGACGTGAAGCTCCGCTAT------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V W D Q A G W D T Q G L P V E L E V E K R L G
- - W D Q A G W D T Q G - - - - - - - - - - - -
------TGGGACCAGGCCGGCTGGGACACCCAGGGG------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L R S K K E I E E Y G V E R F I E E C K K L V D
- - - - - - - - - - - - - - - - - - - - - - - D
---------------------------------------------------------------------GAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y Y L G H W E R A S K R L G L W L D Y Q H A Y Q
Y Y L G H W E R A S K R L . . . . D - - H A Y Q
TACTACCTCGGGCACTGGGAGCGGGCGAGCAAGCGGCTA------------GAC------CACGCCTACCAG
121122123124125126127128129130131132133134135136137138139140141142143144
T R D P R Y I E A I W E F V K R A H E K G L L Y
T R D - - - - - - - - - - - - - - - - - - - - -
ACAAGGGAT---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E G R R V V P R C P R C G T A L S S H E L A Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y E E V D D P S V Y F K L P L E G L E N T Y L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A W T T T P W T I I A N E A A V V H P E E W Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F I A V G D E V W I L A E K R L E A F A K E V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L E N Y T V I N R V T G S S L V G M R Y R H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L E E V P Y H Q R H E P P Y H T V L A A D W V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M E D G T G V V H A A P A H G P E D F E L G Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H G L E A Y T P L R E D G V F G E E A G A F K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L W F E D A S R K V V E V L K E K G L L V H A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V R H E Y P F C W R C G T R L F Y Y A S R Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F I R L T D E L K R K M A E E V Y S M R W A P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W A V K R M G D W V E N A R D W C I S R E R Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G T P L P V W R C T G C G H I V V V G S L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R K L A V D P E S V P E D P H R P H I D R V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R C P E C G G V M K R E P F V V D V W M D S G V
- - - - - - - - - - - - - - - - D V W M D S G V
------------------------------------------------GACGTGTGGATGGACAGCGGCGTA
505506507508509510511512513514515516517518519520521522523524525526527528
A H T A A L R Q Y G W L S L W D K L Y P Y T W I
A H T - - - - - - - - - - - - - - - - - - - W I
GCGCACACT---------------------------------------------------------TGGATA
529530531532533534535536537538539540541542543544545546547548549550551552
T E A A D Q T R G W F Y T L L V T G V V W H G R
T E A A D Q T R G . F Y T L L V T G V V W - - -
ACCGAGGCCGCCGACCAGACCCGTGGC---TTCTACACGCTACTCGTGACGGGCGTAGTCTGG---------
553554555556557558559560561562563564565566567568569570571572573574575576
A P Y R S V L L Q G H V L D K H G K K M S K S K
- - Y . S V L L Q - - - - - - - - - K M S K S -
------TAC---AGCGTGCTGCTCCAG---------------------------AAGATGAGCAAGAGT---
577578579580581582583584585586587588589590591592593594595596597598599600
G N V I W A M D W M E K N G T D P M R I F L L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R A P W D S I N F D P D E V K R Y Q G Y L N I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
W N T V K F A D T Y M E L D Q W K P K P P T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R L Q A E D R W I L Y R L H E A L R R V E E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E S D N M H Q A V Q A L V D L V V E Q L S H R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I P L I R P R V W E E E A T E S K D A A Y A T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y Y V L K A T L A A M A P V V P F L S E Y L Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A F I R K Y E P D A P E S V H M L Q W P Q V P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E L L D E E S Y R A V E E A L D A A E K V L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R S E R R L K R R W P L R R A A V A A K P G T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L S P S R L Q E A A D V L A R F A N I K T V E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V E G A P E W A A G A E K L E T D S M V V Y V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
M E L D E E T M L E G L A R E V I R R A Q V L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K E L D L P V D H T A K R L I V Y A A G R L R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A V E R H M E L I A R E V R V E R V E L A A E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956
P A E G K R W R I E E D E L V V A L E P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_ile_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q A Q R Y R L I E Q G N T I M D I D N E I L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y W N D H A I N E K I F K K E G T K K F V F L E
- - - - - - - - - - - - - - - - - - - - V F L E
------------------------------------------------------------GTCTTTCTTGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G P P T A N G R P H I G H A M T R T I K D I V L
. P P T A N G R P H I G H A M T R T I K D I V L
---CCGCCAACAGCTAACGGAAGACCTCACATAGGGCACGCAATGACGAGAACGATCAAGGATATAGTCCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R Y N T M T G H K I Y R R Y G G W D C H G L P V
R Y - - - - - - - - Y R R Y G . W D C H G - - -
CGGTAT------------------------TACAGGCGTTATGGA---TGGGACTGCCACGGT---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L E A E K Y F G F K T K S D I I N Y G V E K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N S Y C R D S V F R Y I D E W K T V D Q I I G F
- - - - - - - - F R Y I D E W K T V D Q I I . .
------------------------TTTAGGTACATAGATGAGTGGAAAACCGTAGACCAGATCATC------
145146147148149150151152153154155156157158159160161162163164165166167168
S I D H S G D Y I T L R N E Y I E S E W Y V L K
. . D - - G D Y I T L R - - - - - - - - - - - -
------GAC------GGCGACTACATAACGTTGAGG------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y I Y E N G L L Y K D Y T V V P Y C P R C E T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L S S H E V A Q G Y K D V K D P S V Y V R F K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K G S E N T Y F V A W T T T P W T L P S N E F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V N P D I E Y S L I E Y N N A K Y Y V A S S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A Q Y I F K D F K V L K K M K G F E L A G K G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E Q L L P F L D P P A G A L R V V T G D F V T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I D G S G I V H A A P A F G S D D Y Q I G K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N V P I L N P V D K N G R F S D E R L P W Y G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K V R E A N E D I I V Y L K N N G L L I K S E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y E H S Y P F C Y R C D T P L L Y Y P L D A W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I R V S S V R D K L V E N N E K I R W K P D Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K H G R F G N F L D E A K D W N L S R D R F W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T P L P V W R C R N N H V R F I G S R K E I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M G A T V P Q D L H R P Y I D E V K F V C P D C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G E E M R R E P Y V I D T W F D S G S A T Y A A
- - - - - - - - - - - D T W F D S G S A T Y - -
---------------------------------GATACGTGGTTCGATTCAGGAAGCGCTACATAC------
529530531532533534535536537538539540541542543544545546547548549550551552
M H Y P F E D N F D P S S D L P V S F I T E A I
- - - - - - - - - - - - - - - - - - F I T E A I
------------------------------------------------------TTCATAACTGAGGCCATC
553554555556557558559560561562563564565566567568569570571572573574575576
D Q T R G W F Y V L H V I S T I M F N K N A Y D
D Q T R G . F Y V L H V I S T I M - - - - - Y .
GACCAGACCAGGGGG---TTTTACGTTTTGCACGTAATTTCAACCATAATG---------------TAT---
577578579580581582583584585586587588589590591592593594595596597598599600
S A L S I S F I L D E Q G R K M S K S K G N S V
S A L S I - - - - - - - - - K M S K S - - - - -
AGCGCATTGTCTATA---------------------------AAGATGAGCAAAAGC---------------
601602603604605606607608609610611612613614615616617618619620621622623624
F A L D Y L K Q V A P D S L R L F F L Y G A P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K S K N L D R K I I D E V S R R V I S T L L N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y S F F A Y N A N I D G F E F K G I L E A K D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L D K W L I S K I N T F I I E S R R A Y D D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F H E V V R L S M D F V D N L S N F Y L R L S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R R F W A E D V T E D K L A A Y S T L Y T A I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T C S K V L A P I V P F V S D Y L Y L S L H G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Y E S I H L D S F P E P D T S K I D H D L E K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
M D Q A Y S V I E T V R R I R Q E I N I K G R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P V K E I L L S G N I D P E I I P V V S Q E V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A K E I R I V S S E Q R P L K Y T V D L K M E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A A P I L R S S V N S V R E A L K S I D G K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
F D A V Q N G G K L R V L D H E L T G E M L N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
S T I P D P D Y G Y S R D E K N G I D V F V N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R I D R N E Y L E G L A R E I V R R I Q L M R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E M N L D Y T D R I N V W I D P V G D F S D A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
D K F E S Y I K A E T Q C D S L N V G H T D D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
R K W E I G D E T I G I R I E K V V P K
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_ile_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T S K F D P L K F E E E V L K Y W D D N K I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K K L K E I N E K N H K K F L F I D G P P Y P S
- - - - - - - - - - - - - - L F I D . P P Y P S
------------------------------------------AGTTTCATTCTT---ATATTGCTCCCACTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S P I P H I G T V W N K T I K D C I L R Y E R L
S . I P H I G T V W N K T I K D C I L R Y - - -
CTT---TAGATCTACTTTATCATTAGGCGCTCTTATAGACAATAATATGTATTCATTTACATT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M G Y S V K D Q P G Y D T H G L P I E V E T E K
- - - - - K D Q P G Y D T H G - - - - - - - - -
---------------TTGAATCCTTCTTATTAGATCCCTTATTAT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R L G I K S K A E I I E K I G V D N F I S K C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E F A I N N S K S L T Q N F R N L G I F M D W E
- - - I N N S K S L T Q N F R N L . . . . D - -
---------CGATATATCAAGTCTGAGATTTTCGGAATCAACATTAAATTC------------ACT------
145146147148149150151152153154155156157158159160161162163164165166167168
N P Y F T F N N D Y I S N S W A V I K K A Y E R
N P Y F T F N - - - - - - - - - - - - - - - - -
ATCTTGTGCAACTTTATCAGA---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G L L Y K G V H V L H W C S R C E T T L A D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V S E Y R D L E D P S I Y V K F R V K G E P N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y L V I W T T T P W T L P A N V F V M V N K D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E Y A D V R V G D E I L V I A K D R V K E L M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E A R I K E Y K I L R V Y K G E E L I G L E Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H P L A D I V N A Q S K I N N H H K V L D G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A V T L Q E G T G L V H S A P G H G D I D F E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G K K Y D M P V V M L V N D K G E F T Q D S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y A G K Y V R S A S E E I I S D L K Q R N A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y A S K I V H R Y P V C W R C K T P L I L R A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E Q W F I A V S K L K D N L M G E I D R V R W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P D W G K T R I G N M V K E V R D W V I S R Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F W G I P L P I W V C S N C E N I I V V G G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L N K I S I N Q V P Q D L H R P W I D S V V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R C E K C G G E A R R I S D V A D V W F D S G V
- - - - - - - - - - - - - - - - D V W F D S G V
------------------------------------------------GAAGAATGCTACACCGCTGTCAAA
529530531532533534535536537538539540541542543544545546547548549550551552
A F F A S L G K D W R K K W S E L G P V D L V L
A F F - - - - - - - - - - - - - - - - - - L V L
CCATACATC------------------------------------------------------TACGCTATC
553554555556557558559560561562563564565566567568569570571572573574575576
E G H D Q L R G W F F S L L R T G V I L M D R A
E G H D Q L R G . F F S L L R T G V I L - - - -
TATCCATGGTCTATGCAAATCCTG---CACTTGGTTTATAGAGATCTTATTTAATTCATC------------
577578579580581582583584585586587588589590591592593594595596597598599600
P Y E A V L V H G F M L D E Q G K E M H K S S G
- Y . A V L V H - - - - - - - - - E M H K S - -
---AAT---ATTTTCACAATTACT---------------------------CCAGAATCTTTGCCT------
601602603604605606607608609610611612613614615616617618619620621622623624
N Y V E P S Q V V S K Y G R D T L R L W L L R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T T W E D A K F S W K S L D M T R R D L N I I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N V Y V F A N T Y M S L D E F K Y S K Y S Y Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
I K D Y L K L E D I W L L S R Y Y R M L K E V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E A M K E Y K V H E L A N K V T T F I I D D I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R F Y L R V T R K R A W N E A N D P D K I A M Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y V L Y H V L K G S L I L L S T V I P F A A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I Y L D F V Q E R L E S I S M E K I P E I K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F I N E E I E E A F E I A K E I I D A G L N A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A K A G I K L R W P L K E V Y V F L V S D K D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R S I E K I T D V L S S L L N S K S I I I E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
D G Y K R F S K I R A T P N T G S I G P T F K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L S V K V A E Y I Q N N S D K V A Q D I V S K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
Y H E F N V D S E N L R L D I S H V N L V E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E K G Y A S A R F S K G V V L L K Q E M S K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E E E G I I R D L I R R I Q F M R K Q L S L N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
N E Y I L L S I R A P N D K V D L I K K W E Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
I K N E T R A K E L R I G D V S G D L I Q D W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
V E E E T Y T I G V S K A D V S V S
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_ile_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G A G E M A E A L G E E L E R E I Q R R W E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M D L L S K V L E K N R D G P L F Y F L D G P P
- - - - - - - - - - - - - - - - - Y F L D . P P
---------------------------------------------------TACTTCCTCGAC---CCACCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y A S G S I H L G T A W N K I I K D A V N R Y K
Y A S G S I H L G T A W N K I I K D A V N R Y -
TACGCGAGCGGCTCGATTCACCTCGGTACAGCCTGGAACAAGATCATCAAGGACGCCGTGAACCGGTAC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L M R G Y R V R L Q P G W D C H G L P I E V K V
- - - - - - - R L Q P G W D C H G - - - - - - -
---------------------CGACTGCAGCCCGGTTGGGACTGCCACGGT---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E Q E V L S D E I E C K K D I E E K V G V D K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E K C K E F A L K H V E I M T E Q F K R L G V
- - - - - - - - L K H V E I M T E Q F K R L . .
------------------------CTGAAGCACGTAGAGATCATGACGGAGCAGTTCAAGCGTCTG------
145146147148149150151152153154155156157158159160161162163164165166167168
L M D W D N P Y M T L D N E Y I E G A W Y T L K
. . D - - N P Y M T L D - - - - - - - - - - - -
------GAC------AACCCGTACATGACCCTGGAC------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R A H E R G L L D R D V R I V N W C P R C E T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L A D H E V E Y K E V E D P S I F V I F P I E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D S D A E V D L P E N S A L L I W T T T P W T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P A N L A V A V H P E E E Y V L A R A E V D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E W H L I V A D K L K V V L S V V T D S Y E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D S F P G E A L E G L R Y R P P L W E E V P K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R E L H E E D D R V H R V Y T A E W V T M E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T G C V H S A P G H G E E D F E L G R E V G L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P H C P V A E D G T F T E D G G K Y E G L Y V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D A N E K I V E D L R E K G L L A H E D T V E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R Y G H C W R C K T P I I Y R A T E Q W F L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T E V K D E M L E W I E R V E W I P E W A G H S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F K S W V E N A R D W C I S R Q R Y W G I P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P V W E C E E C G H L E V I G S L S E L E A K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V S L P P G E P D L H R P W V D E V V L K C P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
C G S Y M R R V P D V L D V W V D S G V A A W A
- - - - - - - - - - - - D V W V D S G V A A W -
------------------------------------GACGTCTGGGTAGACTCGGGAGTCGCCGCGTGG---
553554555556557558559560561562563564565566567568569570571572573574575576
S L G Y P R R E D E F E R W F L K E G R C D P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D P E A G A D F I T E G H D Q T R G W F Y S Q L
- - - - - - - F I T E G H D Q T R G . F Y S Q L
---------------------TTCATCACCGAGGGTCACGACCAGACCCGCGGA---TTCTACTCGCAGCTA
601602603604605606607608609610611612613614615616617618619620621622623624
G C G V V T F D T C P Y R T V L M H G F T L D E
G C G V V T - - - - - Y . T V L M H - - - - - -
GGTTGTGGCGTCGTCACC---------------TAC---ACCGTGCTCATGCAC------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E G R K M S K S L G N V V D P M D V V E K Y G A
- - - K M S K S - - - - - - - - - - - - - - - -
---------AAGATGAGCAAGTCC------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D T L R W Y V L R S N A P W R D M H F S W Q D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R D T H R A L N V L W N A Y R F T K M Y S E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E F D P E E H P L E D L E E H L K P E D R W L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S R I N S L V E E V T D A F E R Y H V H E A A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A L Y R F V T E D L S R W Y I R L V R E R V W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E G D D P E K L A V Y A V L H Y T F D R L V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L A P I V P H V A E R I Y L D Y V R A G D D P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S V H L T D W P E V D D R W V D E G L E K A M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L V R K A A E A A L S V R Q R A G V K T R W P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R R L F V E V E D P K R L E D L K D V L A R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
N V K E V E L G E E F P E K V P V A E P R P D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
I G P E F R S L A G R V I E H V K D R A E E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R S I L K D G E Y R T E L D G E D V V L T E E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
V K V T E D L P E G W E A E E F E G G R V Y V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
V E L D E E L K S E A W A R E V V R R V Q E M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
K E L D L N L E E R I R V W I E T D E E I A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
V E E H S E Y V R G E T R A D E L H V N E G W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
E E V D L E R E W E V E D R T I R I A V V V S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_ile_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q E V T S S F T P R V I E A S V Q K F W T Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D I Y A R V Q E Q N R D G K T W F F V D G P P Y
- - - - - - - - - - - - - - - - F F V D . P P Y
------------------------------------------------TTTTTCGTAGAT---CCGCCATAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T T G H I H L G T A W N K I L K D S I L R Y K R
T T G H I H L G T A W N K I L K D S I L R Y - -
ACCACCGGGCACATTCACCTTGGAACAGCATGGAATAAGATCCTCAAAGACAGCATTCTCCGGTAT------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M H G L H V I D R A G Y D M H G L P I E V R V E
- - - - - - I D R A G Y D M H G - - - - - - - -
------------------ATCGATCGTGCCGGATATGATATGCACGGC------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H E L G F E N K K D I E A F G I G A F I E R C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q F A L S H K D I M S E Q F K S L G V W M N F D
- - - L S H K D I M S E Q F K S L . . . . N - -
---------CTCAGCCATAAAGACATCATGTCAGAGCAGTTTAAATCTCTC------------AAC------
145146147148149150151152153154155156157158159160161162163164165166167168
D P Y Q T I M P E Y I E A A W W T L K Q A D E K
D P Y Q T I M - - - - - - - - - - - - - - - - -
GATCCCTACCAGACCATCATG---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G L L D R G H R V V N W C P R C E T A I A D S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V E Y W D E Q D P S I F V K F P I H G L M N E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L V I W T T T P W T L P A N V A V A V D K D F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y A R V E A I K E G K K E I L W I A K D L V E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V L K R G K Y Q D Y S I L S E K T G E E L A G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T Y D S P L A D L I P R Q K E I V H T V V T A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F V E M D N T G M V H I A P G H G W D D Y L L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V E K G L D V F C P V D G A G Y Y T D E G G I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A G Q F V R D A N E K I L S D L G S H L L G R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K I T H R Y G H C W R C K T P I I Y R A T E Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F I S V P K M K E K M L S E I K A T S W Y P D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A G S A R F Y D F V S D A R D W C I S R Q R Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G I P I P V W Q C S S C S A H R V F G T V A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N A A A G S N L T D P H R P Y V D E I T V P C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
C G G T M K R V E D I F D V W F D S A M A S W A
- - - - - - - - - - - - D V W F D S A M A S W -
------------------------------------GATGTCTGGTTTGACTCGGCAATGGCATCCTGG---
529530531532533534535536537538539540541542543544545546547548549550551552
T L G F P R N D A L F H E M W P A D F I T E G Q
- - - - - - - - - - - - - - - - - - F I T E G Q
------------------------------------------------------TTTATCACTGAAGGGCAG
553554555556557558559560561562563564565566567568569570571572573574575576
D Q T R G W F Y S Q L G A S T I A F N R S P Y K
D Q T R G . F Y S Q L G A S T I A - - - - - Y .
GACCAGACCAGAGGA---TTTTACTCACAGCTTGGTGCCTCTACGATTGCC---------------TAT---
577578579580581582583584585586587588589590591592593594595596597598599600
S V L M H G F A L D A D G R K M S K S L G N V V
S V L M H - - - - - - - - - K M S K S - - - - -
AGCGTCCTGATGCAT---------------------------AAGATGAGCAAGAGT---------------
601602603604605606607608609610611612613614615616617618619620621622623624
T P E E V V Q K F G V D V L R L Y I L S S N A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
W E D L K F N W D G V S T V N R T M N I L W N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y R F P L P Y M I L D G F S P A Q T S D G K Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D E Y I V R S Y R E M P E I D R W I I S R I N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I A R S V S A D M D E Y Q L H R V T R L L M N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I L E D L S R W Y V Q I V R P R M W L E E D S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D K K F A Y E T I T Y C L R T L C R L L A P F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P H I T E A M Y E N L R L P E D P V S V H M L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W P A G D I R L I D E N L E R R M D V V R K F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E A V A N A R Q A G K R K L R W P V Q N V I V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T S S E S V I E A F R S M E D L A K D R A N T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
N I E V I Q G S W E R M R F N A E P V M K K I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P S F G K K G P V V K G L I E A A D G S A L R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
Q L E E S G S V T L S D G S E E F V L T A E H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
T F S Q H L P E G I F G A E M T D A S V Y V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
T L T E D L E A E G Y S R E I I R R L Q E M R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
Q L D L N V E D N I V I D A V I E D V H L R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
L S A S W L D L I K Q E V R G K T L K I H D S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
G G R D G S V L F Q L D R D W D I E G V N V T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
G I S L A G
- - - - - -
------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/ile_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P A K Y S P K D V E S E I F K F W E D N D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y R K V K E K G G R K F Y F V D G P P Y T T G R
- - - - - - - - - - - - Y F V D . P P Y T T G R
------------------------------------GCTCTTTATGTA---TTCCCAGCCTTTGACGAGCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I H L G T A W N K V L K D T I L R Y K R M M G F
I H L G T A W N K V L K D T I L R Y - - - - - -
GGCATCCATCTCCACTGTCGTTTCAATGAACTCCTCGACGTCGAGGTCGAGCTC------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A P T D T P G W D M H G L P I E V K V E Q E L G
- - T D T P G W D M H G - - - - - - - - - - - -
------AACAACCTCTCTGGCAAATGCCTCCCTCAC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F R T K R D I E S F G I D K F I E R C M N Y A L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------GTC
121122123124125126127128129130131132133134135136137138139140141142143144
A N K D A M T E Q F K S L A V W M D W E N P Y M
A N K D A M T E Q F K S L . . . . D - - N P Y M
AAGCTCCACACCATCGAAAACGAGCTTTTCGGGAATCTC------------CAC------CGCAAATTCCCC
145146147148149150151152153154155156157158159160161162163164165166167168
T I K A E Y M N A A W F A I K R A H E R G L L E
T I K - - - - - - - - - - - - - - - - - - - - -
AGCCTTTTC---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R K K M V V N W C H R C E T A L A D A E V E Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D E E D P S I Y V K F P V K G E K D T Y I V I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T T T P W T L P A N M A V A V H P S L E Y A K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R A V K D G K V E Y L I L A K E L A D S V L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G D Y D S W E V V E T Y L G E D L E G L E Y E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P L A D E V P L Q K N W K H Q V F F A D F V T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E N T G C V H I A P G H G V E D Y E L G V E K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L E V F N P V D D R G V Y T E E A G K Y A G K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V K E A N D D I I D D L Y R K D L L L A E E R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V H R Y G H C W R C K T P I I Y R A T E Q W F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I S E L K D E M L E E I D K V M W I P E W A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S A R F K D W V S N A K D W C I S R Q R Y W G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P I P V W I C E K C G E M K V V G S I N E I E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E N D L D L H R P K I D A V T F S C Q C G G V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R R V P D V F D V W F D S G V A S W G S I A Y P
- - - - - - - D V W F D S G V A S W - - - - - -
---------------------TGGAACTCTCCTCATTACCCCTCCGCACTGACA------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L R K D K F E E L W P A D F I T E G H D Q T R G
- - - - - - - - - - - - - F I T E G H D Q T R G
---------------------------------------TATCTCGTTAATGCTGCCGACAACCTTCATCTC
553554555556557558559560561562563564565566567568569570571572573574575576
W F Y S Q L G T S V V C F D K A P Y K A V L M H
. F Y S Q L G T S V V C - - - - - Y . A V L M H
---GCACTTTTCGCAAATCCAGACAGGAATGGGGAT---------------CCT---TATGCACCAGTCCTT
577578579580581582583584585586587588589590591592593594595596597598599600
G F T L D E Q G R K M S K S L G N V V E P E E V
- - - - - - - - - K M S K S - - - - - - - - - -
---------------------------CGCACTTCCCGCCCA------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V G Q I G V D G F R L Y V L Y S A P W E D L R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S W E E A R N I N R M L N V V W N A V R F A H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y M S L D N Y S F G E K G E L K I E D R W I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R L E S F I K E A N E A M E G Y Q V H R V V R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F F D F F V E D F S R W Y I Q I I R P R V W E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R D S P S K L A A Y Y T M F R V I D R S L R A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A P F A P L I A E W F Y Q H V V K E F R E G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S I F M E E Y S T A E V E M I D G E L E A A M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V A K E I V E A A A N A R N K A K R K L R W P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R E L V I E S G S E K V R K A V E M L E E T I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S Q C N V K Q V R V V D S F E K E I E I K P N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K Y I G P L L K E K A G E F A K Y V A S L K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P E K L V F D G V E L D P K Q A I V V D Y R L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E G Y E Y A E F S G G V V Y I Y K E L D D E L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R E A F A R E V V R R I Q E M R K E L D L D V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E F I E T T V E M D A E L V K G W E D Y I K S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
T R S Q K L V F G K A E G Y V R E W N I E G K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
6100710081009101010111012101310141015101610171018
V K I G I K R L R G
- - - - - - - - - -
------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_ile_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I Q E A E K S Y R P H R I E E K V Q S F W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E R D I Y E R V K E L R E D R P R Y S F L D G P
- - - - - - - - - - - - - - - - - - S F L D . P
------------------------------------------------------CCTCTGGGGTTC---GAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y C S G R I H L G T A W N K I M K D T Y L R F
P Y C S G R I H L G T A W N K I M K D T Y L R F
TTCCCTGAATTCTTCGCTGCATTTAACTGACACCTCTATGCTGGCCTCAACGTCCAGGTCAAGGTCCTTCCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K S M K G F N V R R Q P G W D T H G L P I E H K
- - - - - - - - R R Q P G W D T H G - - - - - -
------------------------TTCCCGGGCCATTGCCTCGCTCATGATCTC------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E G L L G V R S K K D I E D K I G I E E F V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K C R E F A V E N K A V M T G Q F Q R L G V W M
- - - - - - V E N K A V M T G Q F Q R L . . . .
------------------TTTCTTGCCATCAGTTTCAACCGTGAACTCACCATCGGAGTC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W D D P Y V T F D P A Y M E S C W W T L K R A
D - - D P Y V T F D - - - - - - - - - - - - - -
CAC------TCCGTCTGCGCCTTCCAGTTC------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H E K D L L V R D L R V I T W C P R C E T A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L A E I D Y H D K E D P S I Y V K F P V S G D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H I L V W T T T P W T L P A N M A V A V H P D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E Y A Y A R L D G E T Y I M A E A L V E K V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E E A E I L K R V K G T E L E G L T Y R H P L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D E V P L H R E I E H R V I L G D H V T L T E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T G C V H T A P G H G P E D F E I G K K Y G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I C P V D E A G I F T E E A G K Y S G R F V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D A D E D I I A D L R S K G L L L K A G T I S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R Y G F C W R C K T P I I Y L A T E Q W F L K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T E I K D K M L R E L D R V Q W V P S W A G E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R F R N W I E N A R D W T I S R Q R Y W G I P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P I W I C E E C D S I H V V G S I D E L R E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V E G E L E G D F I H R P H V D R I V L E C G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
C G G R M K R T P D V L D V W I D S G V A G W A
- - - - - - - - - - - - D V W I D S G V A G W -
------------------------------------GGCTGCCCAGCCAGCCACCCCGGAGTCTATCCA---
529530531532533534535536537538539540541542543544545546547548549550551552
A L H Y P S E T E L F R E W F P Y D F I T E G H
- - - - - - - - - - - - - - - - - - F I T E G H
------------------------------------------------------GACTATCCTGTCCACGTG
553554555556557558559560561562563564565566567568569570571572573574575576
D Q T R G W F Y S Q L G C G V I A L D E V P Y R
D Q T R G . F Y S Q L G C G V I A - - - - - Y R
GGGCCTGTGGATGAA---TCCCTCGAGTTCTCCCTCCACCGCCAGCTCCCT---------------TCCAAC
577578579580581582583584585586587588589590591592593594595596597598599600
R V L M H G F T L D E E G R K M S K S L G N V V
. V L M H - - - - - - - - - K M S K S - - - - -
---GTGTATGCTGTC---------------------------GGGTATTCCCCAGTA---------------
601602603604605606607608609610611612613614615616617618619620621622623624
E P E D V I E K Y G A D V L R F Y L L W E N K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
W E D L K F V W D E L R N V N K M F N I L W N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y V F A T T Y M S L D R F Q P G D H S A E D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F R D E D R W I L S R I N S V A L K V T E A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N L H F H R A T R E I H D F I V E D L S R W Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R L I R S R T W I E R D D P D K L A A Y H T L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T V L K T L I V T L S P M A P H V C E D I Y Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L V R G A E P D S P E S I H M L D W I L D E G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V D S Q L E A D M D I V R E I I E A C A R A R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
T A R Y K L R W P V R E M V V V S E D E G V L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A A E S L K N V I A E Q A N A K S I K T S T E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P D M K I I A R P N P A T L G P R L R Q D I P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V M R E L E G A D G S A V K A A L D S D G E F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V E T D G K K F K L T S E D I V F E T E L P E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
I V S A Q F D G G S V F I D T E L T P E I M S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
A M A R E L V R R I Q D M R K D L D L D V E A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
I E V S V K C S E E F R E L T E P Q R E F I E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
E V R A S T L S F D Y S E L E Y T K E W K I S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
E N L I I S I K P A K V
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_ile_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P H G D L P L P P S Y R P H E V K K A V E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W R R N R I F E K W K S W R G G P K F T F L E G
- - - - - - - - - - - - - - - - - - - T F L E .
---------------------------------------------------------ACTTTCCTTGAA---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P T T N G M P H V G H I R G R T Y K D V V I R
P P T T N G M P H V G H I R G R T Y K D V V I R
CCTCCGACAACTAACGGCATGCCCCACGTCGGTCATATAAGGGGCCGCACTTACAAAGATGTCGTCATAAGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F Y R L L G Y D V W V Q G G W D M Q G M P V E W
F - - - - - - - - W V Q G G W D M Q G - - - - -
TTT------------------------TGGGTGCAAGGCGGCTGGGATATGCAGGGA---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E V E K K L K L R S K K D I E Q F G L E K F A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E C N S L V E E Y L A Y W R E W G T K R L G L W
- - - - - - E E Y L A Y W R E . G T K R L . . .
------------------GAGGAGTACTTGGCCTATTGGAGGGAG---GGTACTAAAAGGCTG---------
145146147148149150151152153154155156157158159160161162163164165166167168
L D L E N A Y E T R Q P H Y L Q Y A W R I V K R
. D - - N A Y E T R Q - - - - - - - - - - - - -
---GAT------AACGCCTATGAGACTAGACAG---------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A H E L G L L T E D Y R V L W F C P R C E T S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S D H E V A L G Y D E R E D P S I Y V K F R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G G V D E Y L V I W T T T P W T I V D N E A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V H P D Y V Y A K V E V E V G G R R E Y W W L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E A L V P S L M A K F G I K T W R V V E T K K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V E L A G V R Y I H P L A E E V P E R A S R P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q V V T A E F V T L E Q G T G L V H I A P G H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P E D F E L A K K Y G L P V T N S V E I N G I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N E L G G R Y K G K H V Y D V D K E V T R D L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S K G L L V F E E K I R H E Y P H C W R C G S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L I L R A D R Q W F I A I S R I R D K M Y A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q K V N V V P T K L R D R F D I F V Q N A R D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N I S R S R V W G T P L P V W R C K K D G R I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V I G S L E E L K K L A K E L P P V D D F K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H R P W I D Q V K I S A H D C D E W V R E P Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
M D V W L D S G I A W I A A V D G E N N R D L W
- D V W L D S G I A W I - - - - - - - - - - - -
---GACGTCTGGCTGGACTCAGGCATTGCGTGGATA------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E K L F P Y D F V T E G I D Q T R G W F Y S L L
- - - - - - - F V T E G I D Q T R G . F Y S L L
---------------------TTCGTCACAGAGGGCATTGACCAAACCCGCGGC---TTCTATTCGCTACTC
577578579580581582583584585586587588589590591592593594595596597598599600
A T S V L Y T G R A P Y K N V L I Q G L I L D K
A T S V L Y - - - - - Y . N V L I Q - - - - - -
GCAACGTCTGTATTATAC---------------TAT---AACGTGTTGATTCAA------------------
601602603604605606607608609610611612613614615616617618619620621622623624
H G Q K M S K S K G N V I W A K D L F E K Y G A
- - - K M S K S - - - - - - - - - - - - - - - -
---------AAGATGTCTAAAAGC------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D P V R L Y I L S K V A P W E D L S F D P D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K Y V I G D L N I L W N V V K F A D T Y M S L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G F D A E K Y P L S Q W L E K G L E E D K W I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S E L N I M I S E F T N F V K N F E F H K A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L W R E F V V E T L S H R Y I R L L R R R V W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E E P S P D K Y A A Y A V L H D V L K K V L I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
G S I L V P F I T E Y L W Q A Y V R K Y E K N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P E S V H L A Q Y P A A G S Y D K E L I Y A Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E L F A V F S A L A E A R N K A G I K L R W P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R E A Y V N G A K Y A E R Y T E L L K Y L G N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K E V K V G R R P D Y L C V K E G E L E V C V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
D K I E P E L Y Y E A L A R E L I R R I Q V M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
K E T G L E I S D E I H V V V E T N S D D I K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
A V E Q Y R D Y I A R E T R A V K L I I D A V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981
Q G K E W D I S G E K V K I E I R K A Q A
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_ile_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L R E I D S E I L K Y W K D K N I L E K I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S K G G S K K F V F L E G P P T A N G R P H I G
- - - - - - - - V F L E . P P T A N G R P H I G
------------------------CGTTTCATTTTT---GTATTCTGCGTGCTTATTGAGTGCTTCAAGGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H A M T R T I K D I V L R Y N T M T D H K I Y R
H A M T R T I K D I V L R Y - - - - - - - - Y R
GTCATCAGACAGATCGAGATGCGTGATTATCCTGTCCGTATA------------------------GACCTG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R V G G W D C H G L P V E L E A E K H F G F H T
R V G . W D C H G - - - - - - - - - - - - - - -
TATCCTCCT---GAGCTCCCTTGCCAG---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K S E I V N F G V E K F N Q Y C R E S I F R Y I
- - - - - - - - - - - - - - - - - - - - F R Y I
------------------------------------------------------------CTCAACCATGTC
121122123124125126127128129130131132133134135136137138139140141142143144
D E W K Q V D D L I G F S I D H N G D Y I T L R
D E W K Q V D D L I . . . . D - - G D Y I T L R
CGGATCTAGCCGAACTCCATCGATCTCCAC------------TGA------TCTCTGCACTTCAAGGCCGTC
145146147148149150151152153154155156157158159160161162163164165166167168
N D Y M E S E W F A L K T M Y N S G L L Y K D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T V V P Y C P R C E T S L S S H E V A Q G Y K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V K D P S V Y V R F K S A D E E N T Y F V A W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T T P W T L P S N E F L V V N P D M E Y S L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A Q G S R Y Y V A S S R A G Y I F K E Y R E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R M H G R D L V G K R Y L Q L M P F L D P P S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S L K V V A G S F V T S E D G S G I V H A A P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F G A D D Y Q I G K E E G V E I L N P V D K N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R F A D P R I P W N G K F V R D A N E D I I V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L K K N Q M L L K S E K Y E H S Y P F C Y R C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T P L L Y Y P L D A W F I A V S R I R D K L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y N E R I N W K P D Y L K H G R F G N F L G E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K D W N L S R D R F W G T P L P A W R C K N G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L V F V G S R K E I E D L G G K V P E D L H R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y I D E V R F K C P T C G E E M S R E P Y V I D
- - - - - - - - - - - - - - - - - - - - - - - D
---------------------------------------------------------------------TGC
505506507508509510511512513514515516517518519520521522523524525526527528
T W F D S G S A T Y A A S H Y P F E K N F D P E
T W F D S G S A T Y - - - - - - - - - - - - - -
GCTTCCAGAGTCGAACCAAGTATCTATAAC------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T D V P V S F I T E A I D Q T R G W F Y V L H V
- - - - - - F I T E A I D Q T R G . F Y V L H V
------------------ATACGGCCTATGAAGGTCCTCTGGCACTTTGCC---TAGATCCTCTATCTCCTT
553554555556557558559560561562563564565566567568569570571572573574575576
I A T I M F N K N A Y E S A L S I N F I L D A Q
I A T I M - - - - - Y . S A L S I - - - - - - -
CCTGCTCCCGACGAA---------------CTT---TCTCCATGCTGGCAG---------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G R K M S K S K G N S V Y A L D F L N E V P P D
- - K M S K S - - - - - - - - - - - - - - - - -
------GAGGTTCCAGTCCTT---------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S L R L F F L Y G A P W K S K N L D K K V I D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
V S R K T L M T V L N V Y S F F A Y N A N I D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F Q W N G L Q L S G N A L D R Y M V S K V N S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V R S S R D A Y E S L D F H E V V R A S M E F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D D L S N F Y L R L S R R R F W A E G F D D D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L S A Y S T L Y Y A L K A F S E V M A P I T P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
F S D F I Y L N L G G D K E S V H L E A F P E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D S T L M D E K L E S E M D R A Y S V I E T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R L R Q E N S I K G R Q P L R E I L I A G D M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E S I I D V V K S E L N A K D I K L I E R D Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
P I R L S A D L R M D R A A P V L R S R V N A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R H K I R S M D G L E V Q R Q I S E K G F V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
D G V R L D P D M V E I S R V P D P N Y A Y S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
T E K Y G I D V F I N K N I D R D G Y L E G L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R E L V R R I Q V M R K E M N L N Y T D R I I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
H L D L S D D F L E A L N K H A E Y I K N E T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
S D S I I T D K V E G M K L W E I N G E P V R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014
K I D L A R
- - - - - -
------------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_ile_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y S P E I E K Q I L E Y W K S I G L T H R L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K S L K S G K K W S Y L D G P P F A N D D I H
- - - - - - - - - - S Y L D . P P F A N D D I H
------------------------------TATTAAATCTTC---GCCTTTATAATCGATACCTTCTATTTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H A W G R A L R D S E I R Y R L M R G Y K I
V G H A W G R A L R D S E I R Y - - - - - - - -
TAACTTTATAGGTTGGTATTTCTTTAGTTTTAGCTTTTTCCTCGCTTC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y V R P G F D T H G L P I E V K L E K E H G F T
Y V R P G F D T H G - - - - - - - - - - - - - -
TATTAGGCCTTCCCTTATTAGATTGCTATC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N K D D I I K Y G V D K F I E E A R Q F A Y K N
- - - - - - - - - - - - - - - - - - - - - Y K N
---------------------------------------------------------------TTCTATCTC
121122123124125126127128129130131132133134135136137138139140141142143144
I N K Q I S S F K R L G V L A D Y D N P Y F T Y
I N K Q I S S F K R L . . . . D - - N P Y F T Y
TTTAGGCAATTGCTTGCTTATATACAATTTTGG------------AAT------TCCATGCTTGTTTCTTAA
145146147148149150151152153154155156157158159160161162163164165166167168
D N N Y I E R I W K I I K K A W E E G L L Y K G
D - - - - - - - - - - - - - - - - - - - - - - -
AGA---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K Y V V H W C P R C Q T A L A P N Y E V I Y K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V E D P S I F V K F P L K N E D A Y L L I W T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T P W T L P Y N L G V M V N P N A T Y V L V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E N G E K L Y I A K D R L I V L V T L G H K Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I L K E V Q G K D L E G L E Y Y P P F Y E E W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E I Y D E L K K Q Y K N V H T V W L S E E Y V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L E E G T G L V H A A P G C G P E D F E V G L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y N V P P F N D L K E D G S F V R E P F K G W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A K K D D D K F I E L L E K K G L L F H K D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K H N Y P V C E R C K S K L I F R V T E E W Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K V T A Y K N K M I E E A S K V N W V P E K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R A M L Q W L S N I R D W A I S R Q R F W G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L P I W K C E N N H Y L V I S S K E E L E K Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G L T L K R F I I I V K H K E L D K D Y I K T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F G D F I E T D D V E S V I E K E K E A I I L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N R D A N E L E Q K L K E K Y Y V Y R F G G D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y T I L R V Y S Y D L H K P W I D N I E I K C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V C G R P M K R E P D V L D V W L D S G G A F Y
- - - - - - - - - - - - - D V W L D S G G A F Y
---------------------------------------AGGAACCCAATTGACTTTAGATGCTTCCTCAAT
601602603604605606607608609610611612613614615616617618619620621622623624
A T F D N E E A Y K I F Y P F D F I L E G W D Q
- - - - - - - - - - - - - - - - F I L E G W D Q
------------------------------------------------TCTAAATATAAGCTTACTCTTACA
625626627628629630631632633634635636637638639640641642643644645646647648
I R G W F Y S L L G E G V L Y T N Q S P Y K N V
I R G . F Y S L L G E G V L Y - - - - - Y . N V
TCTCTCACA---AGGGTAATTATGCTTTATTTTGTCTTTATGGAA---------------CTC---TAATTC
649650651652653654655656657658659660661662663664665666667668669670671672
Y V S G F V L D E Q G R K M S K S L G N F I Y A
Y V S - - - - - - - - - K M S K S - - - - - - -
TATAAATTT---------------------------TTTAAATGGCTCTCT---------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R E L M E K Y G A D A V R L F T I Q A T G P Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D L I L R I D G I K E K Q S N L N I L Y N I V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y Y F D Q K E Y L K V N P E P K K L N I V D Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V I Y K I N K A I E E T I N Y F E N Y Q I W K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P K P L E E F W L E L S R F Y I K V N R E R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K S K D D A A T I L Y V L K Y S L D K L I R A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A P I I P F S A E Y L Y Q K M R D E L G Y K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S V H L L P Y P E P E K I E F Q Y L E E I E I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K K V I E M A N S L R N K H G I G I R W P L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L Y I S K Q L P K E I E E I L K E V L N V K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V Y T K E G I D D V I V N D I E V G L S F K L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
S N L I R E G L I R E T I R R I Q E A R K K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
L K K Y Q P I K L K I E G I D Y K G F E D L I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
N R V N A E F S E N E E W D L V E E Y N I K G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
61007100810091010101110121013101410151016
K V K I F V K K
- - - - - - - -
------------------------
Class I
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_ile_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I K E P E F R D Y T P G K L E E K I E E F W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E N N I Y Q K I K E L R K N G P K Y Y F L D G P
- - - - - - - - - - - - - - - - - - Y F L D . P
------------------------------------------------------CAAGAGCTCGCG---GTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y V S G A I H L G T A W N K I I K D M I I R F
P Y V S G A I H L G T A W N K I I K D M I I R F
ATCGGTTGTCTCTATTGTGACAACAATTCTATCATTGACGTCGAGGTCAAGCCTCTTTCTCATCTCTTGAAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R T M Q G Y N V W R Q P G F D M H G L P I E V K
- - - - - - - - W R Q P G F D M H G - - - - - -
------------------------CCCTTCAGCTAGCAGTTCCCTTGTAAGGGT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E Q A L G L K T K K E I E E K I G V E N F I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K C K E F A L N N L K I M T E Q F K M L G I W M
- - - - - - L N N L K I M T E Q F K M L . . . .
------------------GATCTCAACATCAACCTCTCCCTTCTCGTAGAGCTCGAGCCC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W D D P Y M T I K N E Y I E S A W F T L K K A
D - - D P Y M T I K - - - - - - - - - - - - - -
CCA------CACTAGCCTTGAATCTCCCTT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
W E K G L L E K D K R V L H W C P R C E T A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E H E V R G E Y K L R K D P S I Y V K F P I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E N E Y L L I W T T T P W T L P A N L A V S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H P E Y D Y V K V K V E F N G K E E Y W I L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A L V D K V L G E I G V K G E V I E E F K G R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E G L R Y I H V L M D E Y P R Q K E F R E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E W A H R I I L A D F V T L E E G T G L V H T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P G H G E E D F E V G K K Y G L P I Y S P V D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q G R Y V E G K W K G I Y V K E A D P Q I I E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L K E K G Y L V K A G E I E H K Y P H C W R C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T P L I F R A T D Q W F L K V S K V K D R I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E N D E K V T W Y P D W V K I R F D N G V R D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G D W V I S R Q R Y W G I P L P I W Q S E D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I Y V V G S W R E L V E L A V A I E V N G E R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D L P E S Y E E K L K V I E E K L G P E D L H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P Y V D A F I I K V N G K E M R R V K D V V D V
- - - - - - - - - - - - - - - - - - - - - - D V
------------------------------------------------------------------TATAAC
553554555556557558559560561562563564565566567568569570571572573574575576
W F D S G I A S W A S L G Y P R N K E L F E K L
W F D S G I A S W - - - - - - - - - - - - - - -
CTTGAGCTTCTCCTCATAGCTTTCCGG---------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
W P A D F I V E G E D Q V T K W F Y S Q Q A A S
- - - - F I V E G E D Q V T K . F Y S Q Q A A S
------------CCAGGAGCCAACCACGTATATTTCCCCATCCTC---CTGCCATATTGGAAGTGGAATCCC
601602603604605606607608609610611612613614615616617618619620621622623624
V I A F D T V P Y R R V A M H G Y V L D E K G D
V I A - - - - - Y R . V A M H - - - - - - - - -
CCAGTAACG---------------CCAGTC---GCTGTCCCTAAC---------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K M S K S L G N I I R P E E V V E K A G R D T F
K M S K S - - - - - - - - - - - - - - - - - - -
GTCCGGATACCACGT---------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R F Y M L W A T N P W E N L K F S W K G V E Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R R M L N I L W N V Y V L S A T Y M S L D N F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P R N V K V E E L A F R E E D K W I L S R V N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L I R E V E N G I E T F Y L T K A T R A L Y N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V V E D L S R W Y V R L I R K R L W V E G D D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D K L A A Y Y T L W K V F D V L L R L M A P F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P Y I T E E I Y Q N L M R P F I G I E S V H M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
D W P K V D E S A V D E D L E K E M E F I R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V E A G S A A R Q K A R I K L R Y P V R K I I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E T Q D E T V K K A V E R L N Y I L R D Q L N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K E V V I G K V E R E L T V K P N F A K V G P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
F K G D S R L V A K W I N E H G L E L Y E K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
V D V E I E G K K F H L T R E H I I V E E K L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
D F L V A E D F E G G R V Y V D K T L T R E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
A E G L A R E F V R R I Q E M R K R L D L D V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
D R I V V T I E T T D D N R E L L Q E N L D Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
M R E T R A I E V R F E E A K G Y V V E W P E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
Q A K I G I E K V E
- - - - - - - - - -
------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_ile_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I K E I T A K Y N A E Q I E K K V T Q F W E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S D A Y R K T R E R R K T G K R L F F V D G P P
- - - - - - - - - - - - - - - - - F F V D . P P
---------------------------------------------------CAGGTCCTTCAA---TTCAAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y T T G H I H L G T A W N K I I K D T I L R Y Y
Y T T G H I H L G T A W N K I I K D T I L R Y -
GAGCGCTAAGACCTTTTCGGCCTCGATCCTGACAGAGACGCGGATGTTTTCGTCCACAACAAGGTCGAG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S M N N R Y I L E R P G W D M H G L P I E V R V
- - - - - - - L E R P G W D M H G - - - - - - -
---------------------GCGGATGACTTCCCTTGCATATCCTTCAGC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E G V L G F K S K K D I E S F G V E N F I E K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E F A I T Q K Q A M T E Q F Q R L G V W M Q W
- - - - I T Q K Q A M T E Q F Q R L . . . . Q -
------------GGTGACTGGAACAGTGGTCCCGTCAGCCAGTGTGAGTTCAAA------------GGC---
145146147148149150151152153154155156157158159160161162163164165166167168
P E P Y M T L K D D Y I E A A W W T L K Q A H E
- E P Y M T L K - - - - - - - - - - - - - - - -
---TTTCTTTAAAGTAAAACCCTC------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K D L L E V G K R S V N W C P R C E T A I A D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V E Y S E R T D P S I Y V K F K V K G E E N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F I V I W T T T P W T I P A N V A V A V H P A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E Y S K F R A I R Q D G S E E I L I A A T E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K N V L K Q G R Y A D F K V L E T M L G E E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K L E Y E S P V G D L V P I Q N E I K H G V Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A D F V T V E N T G C V H I A P G H G M D D F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G V K H K L P I L C P V G S N G A Y T E E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E Y A G K N V R E A N P I V I E D L K A R N R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L A E G T V T H R Y G H C W R C K T P I I Y L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T E Q W F L K I T E I K E K M L E E I D A V D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y P D W A G S A R F R T W V E G A R D W C I S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q R Y W G I P L P V W K C K K C G K L E V I G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K A E L L E K A G L S G D I E L H R P Y V D R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T V P C E C G G E K K R V E D V F D V W F D S A
- - - - - - - - - - - - - - - - - D V W F D S A
---------------------------------------------------CGGGAACTTCAGGGTTGCCCA
529530531532533534535536537538539540541542543544545546547548549550551552
V A S W A T L K F P Q T H D Q F D E W W P A D F
V A S W - - - - - - - - - - - - - - - - - - - F
GGAAGCAACAGC---------------------------------------------------------ACA
553554555556557558559560561562563564565566567568569570571572573574575576
V T E G H D Q T R G W F Y S Q L G A S M V G F G
V T E G H D Q T R G . F Y S Q L G A S M V G - -
GGGCACGGTAACCCTGTCCACATAGGGACG---CAGTTCGATGTCCCCGCTTAACCCTGCCTTTTC------
577578579580581582583584585586587588589590591592593594595596597598599600
R A P Y K S V L M H G F T L D A G G K K M S K S
- - - Y . S V L M H - - - - - - - - - K M S K S
---------TGT---TATTACCTCAAGTTT---------------------------GAGCGGAATTCCCCA
601602603604605606607608609610611612613614615616617618619620621622623624
L G N V V S P L D I I D R L G A D T L R A Y V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S S S A P W E D L K Y N L E E V E T V H R S I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I L W N V F R F P L P Y M A L D N F D P M Q V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L D S V K D A L R E E D R W I L S R A Q S V I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A V N E A M S G Y L L H K A V R E I L E F A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D L S R W Y I Q L I R P R T W T E A D D P D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A A Y C V L Y E V Y V T I T K L I S P F M P Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A E E M Y Q N L I R N V D P N A P E S V H M C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W P K V N D T Y L D P E L E V A M D T V R S I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E A A S N A R Q K A G R K L R W P V S R I I V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
P E S E A A A K A V N R L G S V L M D Q T N S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A I V L T G V G K S W D E L G L E V I P D P G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I G P V F K K D A G R V I P A L Q K V E G F T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
K K A F A E T G E F E L T L A D G T T V P V T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
G M A N F K E T L P E G T A S A E S D A G L V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
V D A N L T P E L E A E G Y A R E V I R R L Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
M R K E L D L V V D E N I R V S V R I E A E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
L A L V E T L K D L I A E E V R A D V F D L G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
S I E V S G T L V K D W D V E G T A M K M G I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
21043104410451046104710481049105010511052105310541055105610571058
K K
- -
------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_ile_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K R F K Q V E Q F R H P E I E H E V L R W W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E R Q I F P R S I A Q R E N G P T F S F Y E G P
- - - - - - - - - - - - - - - - - - S F Y E . P
------------------------------------------------------TCCTTCTACGAA---CCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P T A N G K P G I H H V L A R T I K D I F C R Y
P T A N G K P G I H H V L A R T I K D I F C R Y
CCCACGGCCAACGGCAAGCCCGGCATCCATCACGTCCTGGCCCGGACGATCAAGGACATCTTCTGCCGCTAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K T M K G F R V E R K A G W D T H G L P V E I E
- - - - - - - - E R K A G W D T H G - - - - - -
------------------------GAGCGGAAGGCGGGCTGGGACACGCACGGG------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E K E L G L E G R A Q V E A F G I E K Y N A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
C R R S V L R Y K E L W D Q L T E R I G Y W V D
- - - - - L R Y K E L W D Q L T E R I . . . . D
---------------CTGCGCTACAAGGAACTCTGGGACCAGCTCACGGAGCGGATC------------GAT
145146147148149150151152153154155156157158159160161162163164165166167168
L E H P Y I T F E N T Y I E T V W W L I K Q I Y
- - H P Y I T F E - - - - - - - - - - - - - - -
------CACCCGTACATCACATTCGAG---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E K G L L Y K G Y K I Q W Y S P G S G T V L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H E V S L G Y K E V D D P S A Y V R F P V L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E R T Y L L A W T T T P W T L I S N V A L A V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A D I T Y V K V R R E D P E R G T E Y L I L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D R L D V L R D E S V E V V E T F P G R A L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T R Y E P L F P Y F K D R F K E G E A W R V I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A D F V S T E E G T G I V H L A P A F G A E D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E A A Q K E G L P L I N P I T P E G T F T D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S L V A G L W F K D A D K V I L R D L R Q R G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L F R Q E T Y R H N Y P H D W R K G T P L M N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P V E S W F I R T T A V K D R M I A L N E T I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W H P P S I G E G R F G E W L R N N V D W A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R Q R Y W G T P L P I W Q S D R N P D Y I E V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G S I E E L R Q K L G G T F P P E A Y N P E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L D L H R P F V D R L T W P A P D G G T M R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V P D L I D V W F D S G A M P F A Q W H Y P F E
- - - - - D V W F D S G A M P F - - - - - - - -
---------------GACGTCTGGTTCGACTCGGGGGCCATGCCCTTC------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N Q E A F R R T F P A D F I A E G V D Q T R G W
- - - - - - - - - - - - F I A E G V D Q T R G .
------------------------------------TTCATCGCCGAAGGCGTCGATCAGACGCGTGGC---
577578579580581582583584585586587588589590591592593594595596597598599600
F Y T L H A I A T M V M D S V A F R H V V V N G
F Y T L H A I A T M V - - - - - F . H V V V N -
TTCTACACGCTGCACGCTATCGCCACGATGGTG---------------TTC---CACGTGGTGGTCAAC---
601602603604605606607608609610611612613614615616617618619620621622623624
L V L D E K G E K M S K S K G N V V D P F D V V
- - - - - - - - K M S K S - - - - - - - - - - -
------------------------AAGATGTCCAAGTCG---------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E R Y G A D P V R W Y M I S N A P P W E N I R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S E R E L D A T R R R F F N T L E N V Y A F F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T Y A N V D G F V Y P A E R M P V G E R T E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R W I I S R L N S T V A E V E A A Y E D Y H P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R A A R A I E R F V D E L S N W Y V R R S R R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
F W S A R T G E Q E N E R D K Q A A Y Q T V Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
C L E T T A L L M A P I A P F F S E W L Y R A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
Q E G S E V K G P E S V H L A D F P K V D R A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I D P V L E Q R M A L A R T I V S I V L A L R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Q A R I N V R Q P L P R I L V V T G T G V D R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V V E S V R P L I L E E V N V K D I E Y V E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
S R V V R R T A R P N Y P R L G K R L G K L M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G V A A R V A Q L T E E E I D R Y L R E G K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
L E V D G Q Q V E L G P E D L E I K S E G I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
W L V G Q E D G V T V A L D T N R T E E L M L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
G L A R E A I N R I Q N L R K K A G F E V T D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
I V V S Y R A E G Q L A R A L A R H A D W I R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
E T L A V A L Q P S E Q P T G T H V E T F D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
G E T F T V G V Q R V P V A T T T G Q R A
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Staphylothermus marinus/Smarinus_ile_aa
Archaea/Staphylothermus marinus/Smarinus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I I G K L K G Q Y D P H K V E E W V K R F W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D E N Q I Y K L V K E K S D R S I L R F N F I D
- - - - - - - - - - - - - - - - - - - - N F I D
------------------------------------------------------------AACTTTATAGAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G P P Y P S G D V P H I G T A W N K T L K D I V
. P P Y P S G . V P H I G T A W N K T L K D I V
---CCACCTTATCCAAGCGGT---GTCCCTCATATTGGTACAGCTTGGAATAAAACGTTAAAAGACATTGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L R Y K R M R G Y N V F D R P G Y D C H G L P I
L R Y - - - - - - - - F D R P G Y D C H G - - -
CTCCGCTAT------------------------TTTGATAGGCCGGGATATGATTGTCATGGT---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E V K V E Q K L G V K V K R E I E E K I G V D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F V N E C K K L V F N N I K S L T K W F K E L G
- - - - - - - - - F N N I K S L T K W F K E L .
---------------------------TTTAACAATATTAAGAGCTTGACTAAATGGTTTAAAGAACTA---
145146147148149150151152153154155156157158159160161162163164165166167168
V F M D W E N P Y L T L R D E Y I E A G W W L I
. . . D - - N P Y L T L R - - - - - - - - - - -
---------GAT------AATCCGTATCTAACCCTTAGA---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K K A A E Q G L L D R E E R V V Y W C P R C S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T L A E Y E V E Y K V L T D P S I Y V K F P V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S R E K E Y L L I W T T T P W T L P A N T F V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A H P D I T Y V R V R V G E E V Y I L A K P R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E K V M S E A G I K E Y E V L E E F P G K K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L E Y D H P L I D I V P L Q E K L S K Y H R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V M A P E F V T T T E G T G L V H G A P G H G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E D F T V A K K I G I D F I A S P I D D E G R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T N V A G K Y A G K K V R E A N P E I I K D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E R G A L L H A S Q I T H K Y P V C W R C K T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I V M R A T K Q W V L R V T K L K E K L I N E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K K V N W I P D W A L D R M M H M L E N L Q D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V I S R Q R Y W G T P L P I W E C P E G H R I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V G S I N E L E K H G G K K P K E L H R P W I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E V E I K C P I C G R P M K R V P D V M D V W F
- - - - - - - - - - - - - - - - - - - - D V W F
------------------------------------------------------------GATGTATGGTTT
529530531532533534535536537538539540541542543544545546547548549550551552
D S A I S F Y A A N G H P E K L R L E D V I L D
D S A I S F Y - - - - - - - - - - - - - - - - -
GACAGCGCCATCTCATTCTAT---------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F I V E G H D Q I R G W F F S L L R A G V L G F
F I V E G H D Q I R G . F F S L L R A G V L G -
TTTATAGTGGAAGGCCATGATCAAATACGTGGA---TTTTTCTCACTACTACGAGCAGGAGTCCTGGGT---
577578579580581582583584585586587588589590591592593594595596597598599600
Q S K P Y N T V L V H G F A L D E H G R E M H K
- - - - Y . T V L V H - - - - - - - - - E M H K
------------TAT---ACGGTCTTAGTTCAT---------------------------GAAATGCATAAG
601602603604605606607608609610611612613614615616617618619620621622623624
S L G N Y V G T D E A I E R A G R D P L R F W V
S - - - - - - - - - - - - - - - - - - - - - - -
AGT---------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S Q N T V W E D L R F S W R G I D E I R R D L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I A W N T F V F A S T Y M N L D K Y D P L Q H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
I D D Y K E F L R Y E D K W L L S R I N S I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K I T E S L E K Y Y I H E A A R E L R K F I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D V S H W Y I R L I R P R V W V E E N T P D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A A Y S V L Y Y V L E K W L R M M A P F T P F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A E K I Y Q E V F R K A N P E L P L S I H L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W P S I D D E Y I D E D L E K I M N V I R E I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E A A A A A R M K A G I K L R Q P V K S L T V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T D R E R I R E V T R K Y S G L L A R L V N V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K V E A K Q V A E I G K I V K Y K V S P I Y R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I G P L Y R K L A K K V I N Y I M E N Q E S I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
R D I I R K G E H T A Y I E G Q E I K L T K E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
V L I T P S Y V E G Y S V E E R E W G S V A I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
T R L S K E E I A E G L A R D I I R R I Q V M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
K E I N L P L D A K I E T Y I Y A P R K H V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
L K P Y T E Y I K N E T R S E K L T Y L D T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
Q L E K I Q G Y R K E W E I Q G E Q Y I I V I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
21043104410451046104710481049105010511052105310541055105610571058
Q L
- -
------
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_ile_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K V E P V N F R E L D K K I K K F W E E N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y Q K V K K K N E R N K E F Y F V D G P P Y C
- - - - - - - - - - - - - - - Y F V D . P P Y C
---------------------------------------------TTCCCTCTCAAT---CTCCTTAAATTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G A I H L G T A W N K I I K D T Y L R F K R M
S G A I H L G T A W N K I I K D T Y L R F - - -
ATCTAAGTCAATGCCCTCAACTTTAATTTTAATCTTCTCCTCAATATCTAAATCCATATCCTT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q G Y N V L D K A G W D M H G L P I E V K V E N
- - - - - L D K A G W D M H G - - - - - - - - -
---------------AACCTCTCTCATTAGCCCCTCTTTTATCAA---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E F G I K N K K E I E T K I G V K Q F I E K C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E F A L K H K E I M E K Q F K N L G V W L D W E
- - - L K H K E I M E K Q F K N L . . . . D - -
---------ATATCCATCTAATATTACAGCTCCTTCTTTCAACCTCTCCAT------------ATC------
145146147148149150151152153154155156157158159160161162163164165166167168
N A Y M P I T K E Y M E I G W W T L K V A H E K
N A Y M P I T - - - - - - - - - - - - - - - - -
ATTTAATGCCTCAACAACCTT---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G L L T R D L R V V Y W C P R C E T A L A E H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V R G E Y K E V Y D P S V Y V K F R L A N E E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T Y I V I W T T T P W T L V A N L A V T V H P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y D Y A Y V E V E F D D K K E V W I I A E K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E E V I N K A K K F H N I K N Y K I I K K V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E L E G I K Y I H P L L E E N E R Q K E F A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L E N A H T V I L G E H V T L E G G T G L V H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A P G H G E E D F E V G K K Y N L P I Y S P I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D E G K Y V E G K W K G V F V K D A D A E I I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T L K N K G L L V Y A G K I K H S Y P H C W R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K T P L L F R A T E Q W F L E I S K I K D N I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E H A K T V Q W I P H W V E T R Y I N G V K F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G D W N I S R Q R Y W G I P I P V W V C E K C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K Y I V V G S V E E L E E K M I N K D E V G E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N D L H K P T V D K I K L R C E C G G E M K R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P D V L D V W F D S G L A P Y A S I G V K E L K
- - - - D V W F D S G L A P Y - - - - - - - - -
------------GTGTAAATCATTAATCTCTCCAACTTCATCTTT---------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K A D F I T E G H D Q V T K W F Y S Q H A L S A
- - - F I T E G H D Q V T K . F Y S Q H A L S A
---------TACAACAATGTATTTTCCACACTTCTCACACAC---TACTGGAATAGGGATTCCCCAGTATCT
577578579580581582583584585586587588589590591592593594595596597598599600
I V F N D I P Y K K C L M H G F T L D E H G D K
I V - - - - - Y K . C L M H - - - - - - - - - K
CTGCCT---------------TCCAAC---CTTAACTCCATT---------------------------TAT
601602603604605606607608609610611612613614615616617618619620621622623624
M S K S L G N V V N P D D V V E K Y G A D L L R
M S K S - - - - - - - - - - - - - - - - - - - -
CCACTGAACTGT------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F Y L L S A N K V W E D L R F V W S E M D D V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S L F N T L W N A Y M F A V N Y M V L D N F K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D E K Y F E Y L K D E D R W I V S R I N S V A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I A I E N L E V P Y F H T Y T W T L K D F I L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D L S R W Y I R L I R D R T W K E K D D A D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A A Y Q T L Y Y V L L K L A T I L A P V A P H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A E A I Y Q N L K T E D M E E S I F M N K I E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D E E F I D E E L E R D M A I V R D V V D A I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R G R D R I K Y T L R Y P L K E I T I A G G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V K K A V E R F E Y I I K E Q G N V K N I K F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E V E G S K Y I I K P N Y R E L G K R Y R S E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P K V V E A L N K A D A K E L M E R L K E G A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
I L D G Y E I K P E Y V E I R L E I P E H I A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
V E F S K G T V F I N T E I T D D L I K E G L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
R E V I R R I Q A M R K D M D L D I E E K I K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
K V E G I D L D E F K E I I E R E V R G Q F V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
E I K A D Y E K D W E I K T P N G E K Y N V K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
4102510261027102810291030103110321033103410351036103710381039
A I E R I N K
- - - - - - -
---------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_ile_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K R S Y S P L E V E E W V L R F W D K N K V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K V K R M T W D E R P N A P L F A F L E G P P
- - - - - - - - - - - - - - - - - A F L E . P P
---------------------------------------------------CCTCTCCACCGC---CCGCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T A N G F M H V G H A R G R T L K D V K L R Y A
T A N G F M H V G H A R G R T L K D V K L R Y -
CTTCCCCGTGGCGTAGACTAGGAGCCTCCTAGCGGTGTGGTCTACGGGGAGGTCCAGCTCCTTCCTGAG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R M R G Y R V W D Q A G W D T Q G L P V E L E A
- - - - - - - W D Q A G W D T Q G - - - - - - -
---------------------CCTGGCGAGGCCCTCCAGCATAGTCTCCTC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K K L G M R S K R D I E R Y G V D R F I E E C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R R L V D Y Y I E H W E R A S K R L G L W L D Y
- - - - D Y Y I E H W E R A S K R L . . . . D -
------------GGCGAACCTGGCTAGCACGTCAGCTGCCTCCCGCAGCCTCTC------------GGA---
145146147148149150151152153154155156157158159160161162163164165166167168
G H A Y Q T R H P R Y I E A I W E F I K K A H E
- H A Y Q T R H - - - - - - - - - - - - - - - -
---CTTGGCTGCTATAGCGGCGCG------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G L L Y E G R R V V P R C P R C G T A L S S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V A Q G Y Q E V D D P S V Y F K L P L E G L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N T Y L V A W T T T P W T I I A N E A A A V H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E W Y V F I S V G D E I W V V A E K R L E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A R E V G L E K Y M V V E R V K G A T L A G M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y R H P L A E E V P Y H Q R H E P P Y H T V L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A N W V T M E D G T G V V H L A P A H G P E D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E E C S K R G I E A Y T P L R E D G Y F G P E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G A F K G M W F E D A G E K V I E V L R G K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L V H A G T V R H E Y P F C W R C G T R L F Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A S R Q W F I R I T D E I R R K M V D G V R S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R W A P S W A A R R M S D W V E N A R D W C I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R E R Y W G T P L P V W R C T S C G H T V V V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S L E E L R R L A V D P S S V P D D L H R P Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R V E L R C P K C G G V M R R E P F V V D V W
- - - - - - - - - - - - - - - - - - - - - D V W
---------------------------------------------------------------CCAGTACCG
529530531532533534535536537538539540541542543544545546547548549550551552
M D S G V A H T A A L K Q Y G W L R L W D Q L Y
M D S G V A H T - - - - - - - - - - - - - - - -
CTCGCGGCTTATACACCAGTCGCG------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P Y T W I T E A A D Q T R G W F Y T L L V T G V
- - - W I T E A A D Q T R G . F Y T L L V T G V
---------CGAGCGTACCCCGTCGACCATCTTCCTCCGGAT---GTCCGTTATCCTTATGAACCACTGGCG
577578579580581582583584585586587588589590591592593594595596597598599600
V W H G K A P Y R S V L L Q G H V L D K E G K K
V W - - - - - Y . S V L L Q - - - - - - - - - K
GGACGC---------------GGT---GCAGCGCCAGCAGAA---------------------------GTG
601602603604605606607608609610611612613614615616617618619620621622623624
M S K S K G N V V W A L E W M E K H G A D P M R
M S K S - - - - - - - - - - - - - - - - - - - -
GACTAGGAGCCC------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
M L L L S R A P W D S V N F D P D E V E R Y R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y L N I L W N T V K F A D T Y M E L D K W S P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
P P E P G R L Q A E D R W I I Y R L S Q A L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V E E A V E N D N M H Q A L Q T L V D L V V E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L S H R Y I P L V R P R V W E E E A T E S K E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A Y A T L Y Y V L R R T I A A M A P F T P F I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E Y L Y Q A F V K K Y E P G A P E S V H M L E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P S V D E K L L D E E S Y L A V E E A L E A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K V L A L R S E R R L K R R W P L R R A A I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K P G S S L P V E R L R E A A D V L A R F A N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K A V E V V D S E P G W A P R A E K I E T S S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
T V Y V D M Q L D E E T M L E G L A R E V I R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A Q V L R K E L D L P V D H T A R R L L V Y A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
G K L R E A V E R H R E L I A R E V R V G S I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
L A S S P P R D G K K W R I E G E E L V L S L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985
P
-
---
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_ile_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N R F G D E P D Q Y E P A D V E D R V F D Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A V D A Y E Q T R E H R A D G E D F F F V D G
- - - - - - - - - - - - - - - - - - - F F V D .
---------------------------------------------------------TTCTTCGTCGAC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P Y T S G A A H M G H A W N K S L K D A Y I R
P P Y T S G A A H M G H A W N K S L K D A Y I R
CCGCCGTACACGTCGGGCGCCGCCCACATGGGTCACGCCTGGAACAAGAGCCTGAAGGACGCCTACATCCGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y K R M Q G Y D V T D R P G Y D M H G L P I E T
Y - - - - - - - - T D R P G Y D M H G - - - - -
TAC------------------------ACGGACCGGCCGGGCTACGACATGCACGGG---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K V E E E L G F E S K K D I E E Y G E Q N F I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D C K E F A E E S L A Q L Q S D F Q S F G V W M
- - - - - - E E S L A Q L Q S D F Q S F . . . .
------------------GAGGAGAGCCTCGCGCAACTCCAGTCGGACTTCCAGAGCTTC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W E N P Y R T I D S S Y M E S A W W A F D Q V
D - - N P Y R T I D - - - - - - - - - - - - - -
GAC------AACCCGTACCGGACCATCGAC------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H E R D L V E R G K R S I S Q C P R C E T A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N N E V E Y E D V E D P S I Y V T F D L D D R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G R L V I W T T T P W T I P A N E F V A V D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T T Y Q K V R A T R D G E E H V L Y L A E E C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D D V L S V G R Y D D Y E V E E S L Q G S D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G W S Y T P P L V E E V P A N P A D A E G V H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V Y H G D W V E V D R T G L V H S A P G H G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D F E R G E E L G L P V F C P V G E N G V Y T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G G K Y A G Q F V R D A N D D I V A D I E A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G A M L A H E T V S H S Y G H C W R C D T G I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q I V T D Q W F I T I T D V K D E L L E N M E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A D W Y P Q W A R D N R F R D F V E N A P D W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V S R Q R Y W G I P I P I W T P E D W N G E M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D V L V V G T R E E L A E L A D Q D V D P D T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D L H K D T V D D L T V T K D G T T Y T R V P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V F D V W L D S S V A S W G T L N F P S E T E D
- - D V W L D S S V A S W - - - - - - - - - - -
------GACGTCTGGCTCGACTCCTCGGTGGCGTCGTGG---------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y E E L W P S D L I I E A H D Q T R G W F W S Q
- - - - - - - - L I I E A H D Q T R G . F W S Q
------------------------CTCATCATCGAGGCCCACGACCAGACCCGCGGC---TTCTGGTCGCAA
577578579580581582583584585586587588589590591592593594595596597598599600
L G M G T A A V G E V P Y K N V V M H G H A L M
L G M G T A A - - - - - Y . N V V M H - - - - -
CTCGGCATGGGAACCGCCGCC---------------TAC---AACGTCGTGATGCAC---------------
601602603604605606607608609610611612613614615616617618619620621622623624
P D G R S M S K S K D I R I D P Q E L I D E Y G
- - - - S M S K S - - - - - - - - - - - - - - -
------------TCGATGTCGAAGTCC---------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A D P M R L F V L S V S P R G D D M R V S H D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V G N L Q S D L N I L W N V F R F P R P Y M E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D D F D A N V P T G F G G S G D G V S I D D V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L E T V D E W L L S T L Q R V K A D A T E H W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N Y E Q H R A L E E V L S F V T E D L S R Y Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Q V V R E R M W E T E D S P S K T A A Y A T M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R A L L E V T A L L A P Y A P L V T E E L Y Q H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L S G D E G Y D T V H M C D W P A V D E S L R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P D L E A A V D V L R D V E E A G S H A R Q Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G R K L R W P V T R I V V D A D T D A V V D A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E A H A D L L R D R L N A R T I E V V E P G E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
W G E L A F S A R A D M S E L G P A F G D D A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
R V M N A L N D A H V E S A D L E A L A T Q V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E A L G E D V E L T E E M V E F V E E T P E G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
A G A N F E T G T V Y V D T E L T E D V E S E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
Y A R E V I R R V Q E M R K D L D L E M D A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
R L D V A V F D E R V G R L V A E H E D L I K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
E T R A R E L G D V E D G Y R E E W D V E G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
L A L E I A E L
- - - - - - - -
------------------------
Class I
Bacteria/Escherichia coli/amino acid sequences/Ecoli_ile_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D Y K S T L N L P E T G F P M R G D L A K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P G M L A R W T D D D L Y G I I R A A K K G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K T F I L H D G P P Y A N G S I H I G H S V N K
- - - I L H D . P P Y A N G S I H I G H S V N K
---------ATTCTGCATGAT---CCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I L K D I I I K S K G L S G Y D S P Y V P G W D
I L K D I I I K S - - - - - - - - P Y V P G W D
ATTCTGAAAGACATTATCATTAAGTCC------------------------CCGTATGTGCCTGGCTGGGAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C H G L P I E L K V E Q E Y G K P G E K F T A A
C H G - - - - - - - - - - - - - - - - - - - - -
TGTCATGGT---------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E F R A K C R E Y A A T Q V D G Q R K D F I R L
- - - - - - - - - - A T Q V D G Q R K D F I R L
------------------------------GCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTG
145146147148149150151152153154155156157158159160161162163164165166167168
G V L G D W S H P Y L T M D F K T E A N I I R A
. . . . D - - H P Y L T M D - - - - - - - - - -
------------GAC------CACCCGTACCTGACCATGGAC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G K I I G N G H L H K G A K P V H W C V D C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S A L A E A E V E Y Y D K T S P S I D V A F Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V D Q D A L K T K F G V S N V N G P I S L V I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T T T P W T L P A N R A I S I A P D F D Y A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q I D G Q A V I L A K D L V E S V M Q R I G V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D Y T I L G T V K G A E L E L L R F T H P F M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F D V P A I L G D H V T L D A G T G A V H T A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G H G P D D Y V I G Q K Y G L E T A N P V G P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G T Y L P G T Y P T L D G V N V F K A N D I V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A L L Q E K G A L L H V E K M Q H S Y P C C W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
H K T P I I F R A T P Q W F V S M D Q K G L R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q S L K E I K G V Q W I P D W G Q A R I E S M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A N R P D W C I S R Q R T W G V P M S L F V H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D T E E L H P R T L E L M E E V A K R V E V D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I Q A W W D L D A K E I L G D E A D Q Y V K V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D T L D V W F D S G S T H S S V V D V R P E F A
- - - D V W F D S G S T H S - - - - - - - - - -
---------GATGTATGGTTTGACTCCGGATCTACCCACTCT------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G H A A D M Y L E G S D Q H R G W F M S S L M I
- - - - - M Y L E G S D Q H R G . F M S S L M I
---------------ATGTATCTGGAAGGTTCTGACCAGCACCGTGGC---TTCATGTCCTCTCTGATGATC
577578579580581582583584585586587588589590591592593594595596597598599600
S T A M K G K A P Y R Q V L T H G F T V D G Q G
S T A M - - - - - Y . Q V L T H - - - - - - - -
TCTACCGCGATG---------------TAT---CAGGTACTGACCCAC------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R K M S K S I G N T V S P Q D V M N K L G A D I
- K M S K S - - - - - - - - - - - - - - - - - -
---AAGATGTCTAAATCC------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L R L W V A S T D Y T G E M A V S D E I L K R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A D S Y R R I R N T A R F L L A N L N G F D P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K D M V K P E E M V V L D R W A V G C A K A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E D I L K A Y E A Y D F H E V V Q R L M R F C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V E M G S F Y L D I I K D R Q Y T A K A D S V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R R S C Q T A L Y H I A E A L V R W M A P I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F T A D E V W G Y L P G E R E K Y V F T G E W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E G L F G L A D S E A M N D A F W D E L L K V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G E V N K V I E Q A R A D K K V G G S L E A A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T L Y A E P E L A A K L T A L G D E L R F V L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
T S G A T V A D Y N D A P A D A Q Q S E V L K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L K V A L S K A E G E K C P R C W H Y T Q D V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
K V A E H A E I C G R C V S N V A G D G E K R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938
F A
- -
------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_ile_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F K P V D P N V K F P Q L E E E V L A W W D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N D V V A K S L A A G E K P F V F Y E G P P T A
- - - - - - - - - - - - - - - V F Y E . P P T A
---------------------------------------------GTCTTCTATGAG---CCGCCGACCGCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N G R P G L H H T I S R S F K D V I L R Y R S M
N G R P G L H H T I S R S F K D V I L R Y - - -
AATGGCCGTCCCGGTCTTCACCATACCATCTCGCGCAGCTTCAAAGATGTGATTTTGCGCTAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q G Y R I I G R R E G W D T H G L P V E I E I E
- - - - - - G R R E G W D T H G - - - - - - - -
------------------GGTCGCCGCGAAGGCTGGGACACCCACGGC------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K L G F S G K P D I E R F G I A E F N R L C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E S V W E Y I Q E W K A F T K R I A F W L S E D
- - - W E Y I Q E W K A F T K R I . . . . S - D
---------TGGGAGTACATCCAGGAGTGGAAGGCGTTTACCAAGCGGATC------------AGC---GAT
145146147148149150151152153154155156157158159160161162163164165166167168
A Y I T Y E N D Y I E S T W W I F R Q L W D R G
A Y I T Y E - - - - - - - - - - - - - - - - - -
GCGTATATCACCTACGAG------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L F R D Y K V T M H C P R C G T S L S D H E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S L G A R D D V D D P S V Y I K F R V K G T T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P P P A V D G T L E G A F L V A W T T T P W T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P A N V A L A V K H D A E Y V E V E H N G E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V M A A T L I N Q V L P A E S F T V L R R F R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N D L V G L R Y E P L F R G V P G A G D T V D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E T A Y R V I A D E I V S L D D G T G I V H I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P A Y G D L E V G R K H G L P T L F S V G L D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R V L P E F A D L G F A G K F F K E A D P D I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R N L K A R G L L L R S G R V R H Y Y P F C W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C G T P L L Y Y A K R S W Y I R T T A F K A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V A N N Q Q I H W V P E H I R D G R F G N W L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N N I D W A I S R E R Y W G T P I P I W T N A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G S H M V C I G S L A E L E E K V G R S L R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D L H R P Y I D E V V W E D P D H G L M R R I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D V A D C W F D S G S M P V A Q W H Y P F E N R
- - - D C W F D S G S M P V - - - - - - - - - -
---------GACTGCTGGTTCGACAGCGGTTCGATGCCGGTG------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D V F E M S H P A D Y I C E A V D Q T R G W F Y
- - - - - - - - - - Y I C E A V D Q T R G . F Y
------------------------------TATATCTGTGAGGCGGTAGACCAGACCCGCGGC---TTCTAC
577578579580581582583584585586587588589590591592593594595596597598599600
T L H A V S T L L F D R P A F K N V I C L G H I
T L H A V S T L L - - - - - F . N V I C L - - -
ACCTTGCACGCGGTCAGTACCCTGCTC---------------TTC---AACGTGATCTGTCTC---------
601602603604605606607608609610611612613614615616617618619620621622623624
L D K D G Q K M S K S R G N V I E P Q E V I N A
- - - - - - K M S K S - - - - - - - - - - - - -
------------------AAGATGAGCAAGAGC---------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y G V D A L R W Y L F T A A P P G N A R R F S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D L V S E S M R K F L L T L W N T Y A F F V T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A N L D R W Q P N S G R T A E L Q P I D R W A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A A L N Q L V Q T A T A A F E E Y D V Y S A A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A I E H F V D E L S N W Y V R R N R R R F W K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E G D A D K E A A Y Q T L Y T C L V T V A K L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A P F I P F V S E E I Y R N L V A E R D A S A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E S V H L A R W P E V D Q A L L D D Q L V A D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E A L L T A V S L G R A A R K Q A N I K V R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L S E L W L R A S T P A L L N G V R R F E A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R D E L N V K V V R Y L D A N S A V V E Y R L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P N L R L V G K K F G K L V P A I T T A L R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
T G D D A R A A A Q A V E A G Q P V H L S V D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
Q T I E L L A E E V L V E S S A P A G Y A V A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
A D G M L V A L N T T V T E E L R L E G A A R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
L V R Y V Q D A R K S A G L A I S D R I R L F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
S S T D E A A L L A A T L A Q H G A Y I Q N E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
L A V E L T V S A P P A G A H V E T D E F G D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
E I T I G V V K A G
- - - - - - - - - -
------------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_ile_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D Y K E T L L L P S T T F A M R A N L A E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P Q R F K K W F E Q N Y A Y E K M K E N R K N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K S F T L H D G P P Y A N G H I H I G H A L N
- - - - T L H D . P P Y A N G H I H I G H A L N
------------ATTTTCATTGCT---TTGACTTACCATAAACCAATCGGCTAATTCCTCATTTGGGAATTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I L K E T I I K T H Y F K G E S V R F T P G W
K I L K E T I I K T - - - - - - - - R F T P G W
ATTAAAACTGATGTTTAAATTTAATTCCAA------------------------TTTAAGTATATCAATTTG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D C H G L P I E Q Q V E V K L G E K K K S L S K
D C H G - - - - - - - - - - - - - - - - - - - -
TTCAAAAAATTT------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E I R E F C R Q H A S E F V D I Q R E E F K D
- - - - - - - - - - - S E F V D I Q R E E F K D
---------------------------------TTTGATTAAAACATTAGCATGTTCTAGAGCCTCATCTAC
145146147148149150151152153154155156157158159160161162163164165166167168
L G I I A D W D K P Y L T M K F E F E A A I Y R
L . . . . D - - K P Y L T M K - - - - - - - - -
ACT------------TGG------TAAATTTAAAAGCTCTTTTGC---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T L C E I A K K G L L C E R S K P V F W S W A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K S A L A E A E V E Y Q D K E D Y S I F V A F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L D V K A C E K L G V S K A S A V I W T T T P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T L V A N Q A I A L N P N E N Y V I T K E G L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F A S A L L K S M V E K G L T S G E I Q K E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A K E F E K L E A I N P L N G R K S V L I M G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H V L M D G G S G L V H T A P G H G E D D Y Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C L K Y G I E V L M P V D D S G C Y D E T L R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K G L L P S H L L E E F I G L H I F K A N E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E L L G E K L L H S S K F I H S Y P F C W R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
H K P V I Y R A T K Q W F I L M D E P K L Q G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T L R E C A K E Q L L K T T F Y P Q S G V K R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G S M V E N R P D W C I S R Q R D W G T P I A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F R D K N T K E V I F D D E L F D F V A A I F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K H G A D A W W E F E I K D L I P T N S K Y K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E N L E K V Y D I L D V W F D S G S T F N A V L
- - - - - - - - - - D V W F D S G S T F N - - -
------------------------------GGCCTTAAAAATATGAAGACCTATAAACTCTTC---------
553554555556557558559560561562563564565566567568569570571572573574575576
N S G L Y D A G E K R A S M Y L E G S D Q H R G
- - - - - - - - - - - - - M Y L E G S D Q H R G
---------------------------------------ACATCCACTATCATCAACAGGCATTAAAACTTC
577578579580581582583584585586587588589590591592593594595596597598599600
W F Q S S L L V G T A I N E S A P Y E S I L T H
. F Q S S L L V G T A I - - - - - Y . S I L T H
---ACCGTATTTCAAACAAGCATAGTAATCATCTTC---------------AGT---TACAAGTCCACTTCC
601602603604605606607608609610611612613614615616617618619620621622623624
G F T T D E K G Q K M S K S K G N V I A S E Y V
- - - - - - - - - K M S K S - - - - - - - - - -
---------------------------GATTAAAACAGATTT------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A K T Y G V E I L R L W I L L S D Y S S D L K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S D N I L K Q V G E Q Y R K I R N T I R F L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
N T N D L K D L E V K E F S F I D K W I L S R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T K V F K A S K E A F F A Y E F A K G F S L L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N F L S A D L S G I Y L D I S K D R L Y C D S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N A Q R R K S A Q V A M A L M A K E L L N L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P N L S Y S V D E A L E H A N V L I K G D A K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V F D L S L T Q D F D Y D F G I D D T F L M S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R E K F F E Q I D I L K K D K I I K S T L E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L N I S F N K F P N E E L A D W F M V S Q I S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E N E E I L A E F E V E N E K F K I T K A S L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K C P R C W K L Q S K N E E T P C L R C E E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917
K G V Q C
- - - - -
---------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_ile_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A P Q E K A S A K K A G K N A Y K D T L N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P R T A F A M K A N L V Q S E P Q S V K R W A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L G V Y R Q L R A R A A E A K A A G D P L P A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V A H D G P P Y A N G D I H L G H L L N K V L K
V A H D . P P Y A N G D I H L G H L L N K V L K
GTCGCGCACGAC---CCGCCCTACGCCAACGGCGACATCCACCTGGGCCACCTGCTCAACAAGGTGCTCAAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D L V V R S R S M E G F D C P Y T P G W D C H G
D L V V R S - - - - - - - - P Y T P G W D C H G
GACCTGGTGGTCCGCAGC------------------------CCCTACACGCCCGGCTGGGACTGCCACGGC
121122123124125126127128129130131132133134135136137138139140141142143144
L P I E H R V M Q E L G P G G R E L E P L K I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R K C A A Y A G K H V K T Q R Q Q M E R L L T L
- - - - - - - G K H V K T Q R Q Q M E R L . . .
---------------------GGCAAGCACGTCAAGACGCAGCGTCAGCAGATGGAGCGGCTG---------
169170171172173174175176177178179180181182183184185186187188189190191192
A D Y E N P Y L T M D S R Y E A G V L E V F A G
. D - - N P Y L T M D - - - - - - - - - - - - -
---GAC------AACCCGTACCTCACGATGGAC---------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M L E A G L V Y R D L K P V H W S V D N Q T A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A E A E L E Y H D R E D T S V Y V R F A M N N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G S E G L L I W T T T P W T L P A N L A V A V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P R M E Y G L Y E I A G N D P T W I A V A L A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V A A K R E V G L P G P L K V V K G E A L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R T Y A H P F V G R E G R V V P A E Y V T D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G T G L V H T A P G H G A E D Y Q T G L R E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D V Y C P V L P D G T Y D D T V P D W L R G K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I W E A N Q E I V E R L E R D G V L F F D E R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T H S Y P H D W R G K Q P V I F R A T E Q W F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A V D K P A T G P L A G K T L R Q A G L D A V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K D T S F Q P A W G Q N R L R G M I E S R P D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C L S R Q R S W G L P I P A F F D A Q G R P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T A A S V R A V A E V I G D R G S D A W F F L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A A D L L A R Y D P A A D P D A P A W A G D D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L A S L V K G G D T F D V W F E S G S S W H A V
- - - - - - - - - - - D V W F E S G S S W H - -
---------------------------------GACGTCTGGTTCGAGTCCGGCTCCAGCTGGCAC------
577578579580581582583584585586587588589590591592593594595596597598599600
L R E G W R E A Q A E P A S G E A F P A D L Y L
- - - - - - - - - - - - - - - - - - - - - L Y L
---------------------------------------------------------------CTCTACCTG
601602603604605606607608609610611612613614615616617618619620621622623624
E G S D Q H R G W F Q H S L L P A L A V T G R P
E G S D Q H R G . F Q H S L L P A L A V - - - -
GAAGGCAGCGACCAGCACCGCGGC---TTCCAGCACTCGCTGCTCCCGGCGCTCGCCGTC------------
625626627628629630631632633634635636637638639640641642643644645646647648
P F E G V L T H G F M V D R D G R K M S K S L G
- F . G V L T H - - - - - - - - - K M S K S - -
---TTC---GGCGTGCTCACGCAC---------------------------AAGATGAGCAAGTCG------
649650651652653654655656657658659660661662663664665666667668669670671672
N A L E V A T L M Q Q H G A D V C R W W V A S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
N T D N D V K V D E A F F K T A G E A Y R K V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N T L R F L L S N L D G F R M R G G R V K F E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A D A T S L D A W L T G E L V T L S V S V R R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y R E N R Y R R A Q E L L F G F C N E T L S G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Y L S A V K D R L Y C D E A D G R R R R R T Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
T L Y R V T T V L V R L L G P I L P H T A D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
W A A L H P D D D E A C V H L C R F A D V A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A E T P V S E A W P A V M E A R K R W M L A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Q H R E R A K A C G G A D A P L D L G L V L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A E L P E G F D P V E L A D L C G V S R V E V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E A E E V A V V D L S R Q P R C E R S W K R D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
T V K P R P D N G L L S D R D W R V V S S L H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962
S G
- -
------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_ile_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S N K K A D S K P Q A K Y P V N L L D T P F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M R G D L P K R E P Q W V K D W E A R G V Y E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I R A T S Q G R P K F I L H D G P P Y A N G D I
- - - - - - - - - - - I L H D . P P Y A N G D I
---------------------------------GACCGTCGCCGC---CGTGATCAGCACGAACTTCAGGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L G H A V N K I L K D M V V K S R N M A G F D
H L G H A V N K I L K D M V V K S - - - - - - -
GTCGCCGAGGCTCGCGAGCGCGTCGTAGCGCGCGCCCGACGCGCGCACTTC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A P Y V P G W D C H G M P I E I Q I E K Q F G K
- P Y V P G W D C H G - - - - - - - - - - - - -
---GATCCGGTTCGCGGCGCGCGCTTCCTCCAG---------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S L P A A E V M A K A R A Y A T E Q I E K Q K A
- - - - - - - - - - - - - - - T E Q I E K Q K A
---------------------------------------------GTAGTAGGTCTCGGTGAAGATCGTCTC
145146147148149150151152153154155156157158159160161162163164165166167168
G F K R L G V L G E W G N P Y K T M N F Q N E A
G F K R L . . . . E - - N P Y K T M N - - - - -
GCTTTGCGGCAGGAA------------TTC------CGTAAACGACAGGAACGGCGC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E I R A L G K I I E K G Y V Y R G L K P V N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C F D C G S A L A E A E V E Y K D R T D P T I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V L F A F A E P E K T A H A F G L A A L P R A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G G I V I W T T T P W T I P A N Q A L N L H P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I V Y A L V D T E R G L L V M A E E R V E A C M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D F G L T G R V V A T T R G D K L A N L R F H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H P L A A A H P G Y K R T S P V Y L G D Y V T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D T G T G I V H S S P A Y G V E D F T S C K A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G M T D S D I I N P V M G D G R Y I E S L P L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G G L T I W D A N P K I V D A L K A A G S L L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N E H Y S H S Y M H C W R H K T P I I Y R A T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q W F A G M D T Q P A D G G K T L R E T A L D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V D A T A F Y P S W G K Q R L H A M I A N R P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
W T L S R Q R Q W G V P M A F F V H K E T G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H P R T L E L L E E V A K R V E Q Q G I E A W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T L D A R E L I G D D A N L Y E K N R D T L D V
- - - - - - - - - - - - - - - - - - - - - - D V
------------------------------------------------------------------GATCTT
553554555556557558559560561562563564565566567568569570571572573574575576
W F D S G T T H W H V L R G S H K D Q L Q F P A
W F D S G T T H W - - - - - - - - - - - - - - -
CGGATTCGCGTCCCAGATCGTGAGTCC---------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D L Y L E G S D Q H R G W F H S S L L T A S M L
- L Y L E G S D Q H R G . F H S S L L T A S M L
---GTTGATGATGTCCGAATCGGTCATCCCGTGCGC---GCACGACGTGAAATCCTCGACGCCGTACGCGGG
601602603604605606607608609610611612613614615616617618619620621622623624
D G R A P Y K G L L T H G F T V D G E G R K M S
- - - - - Y . G L L T H - - - - - - - - - K M S
---------------GCC---GCCGGTGTCGGTCGT---------------------------CGTGCGCTT
625626627628629630631632633634635636637638639640641642643644645646647648
K S L G N G I D P H E V A N R L G A E I I R L W
K S - - - - - - - - - - - - - - - - - - - - - -
GTAACC------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I A S T D Y S G E L A I S E E I L K R V T E G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R R I R N T L R F L L A N L S D F D Y A K D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P A E Q W L E I D R Y A V A F S A Q L Q A E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A H Y E K Y E F H P V V A K L Q T F C S E D L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
G F Y L D V L K D R L Y T S A P A S K A R R S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Q T A L Y H V T Q G L L R V L A P F L S F T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E A W R V F L P Q S E T I F T E T Y Y A Y P E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A N A D A L V A K W T L L R D V R G N V T K A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E E A R A A N R I G S S L Q A Q V E V R A S G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R Y D A L A S L G D D L K F V L I T S A A T V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K V D A Q S D E S V E V A A S K Y Q K C E R C W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
H Y R E D V G A H A D H P T L C G R C F S N L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945
E N G E T R S A A
- - - - - - - - -
---------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_ile_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E V S A Y K D T L N L L Q T P F N M R A N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P V R E P E I Q Q F W A D R Q I Y E T L S R Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P G A P F V L H D G P P Y A N G A L H M G H A L
- - - - - V L H D . P P Y A N G A L H M G H A L
---------------CGCCTCGGTTAA---CGTGGGTTGATCACGCAATTCCACTTGCGATACCAAGAAGAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N K T L K D I I N K Y Q L L Q G R K V R Y V P G
N K T L K D I I N K Y - - - - - - - - R Y V P G
ATAGCGCAGATCATCGACCGCCGTTCCCGAGAG------------------------CAAGGCAGCCCGCCA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W D C H G L P I E L K V L Q E L S S E E R R N L
W D C H G - - - - - - - - - - - - - - - - - - -
ATCCGAATCTGCCAC---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T P L T L R Q K A K A Y A L A Q V E Q Q S Q S F
- - - - - - - - - - - - - L A Q V E Q Q S Q S F
---------------------------------------TTGTTGCCACTTGGCCGCAAGTTCTGGTTGATT
145146147148149150151152153154155156157158159160161162163164165166167168
Q R Y G V W A D W D A P Y L T L T P E Y E A A Q
Q R Y . . . . D - - A P Y L T L T - - - - - - -
CCAGTCATC------------CCA------TTGGAAAACTGATTTTGTCCG---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I D V F G Q M V L K G Y I Y R G L K P V H W S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S S R T A L A E A E L E Y P D G H T S R S I Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A M P I V Q L S E A A Q P L L G N Y A N L A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I W T T T P W T I P A N L A V A V N G E L T Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V V Q A G D C H L I V A A E L A E S L S K T F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T E L T V L A T F P G S V L E H S R Y R H P L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D R E S P V V I G G D Y I T T E S G T G L V H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A P G H G Q D D F I V G N R Y G L E V F C P V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D K G D F T A A V G D R L V G K N V L K D A N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A V I E W L T E V G A L L K E E S Y A H R Y P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D W R T K K P T I F R A T E Q W F A S V E G F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E Q A L Q A I A E V D W I P A Q G E N R I T S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V S E R S D W C I S R Q R T W G V P I P V F Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E E S G E A L L N A E T I A H V R A I V A E R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S D A W W E L D V A D L L P E P Y R S N G R R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R K G T D T M D V W F D S G S S W A A V A S Q R
- - - - - - - D V W F D S G S S W A - - - - - -
---------------------CGCACGGAAAATCGTCGGCTTTTTGGTGCGCCA------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E G L H Y P A D L Y L E G S D Q H R G W F Q S S
- - - - - - - - L Y L E G S D Q H R G . F Q S S
------------------------CGCGCCGACTTCGGTCAGCCACTCGATGACCGC---ATTGGCATCCTT
577578579580581582583584585586587588589590591592593594595596597598599600
L L T S V A C N G H A P Y R R V L T H G F A L D
L L T S V A C - - - - - Y R . V L T H - - - - -
GAGGACATTTTTGCCCACGAG---------------CGCCGT---GTCGCCCTTGTC---------------
601602603604605606607608609610611612613614615616617618619620621622623624
E K G R K M S K S L G N V V D P A I V I N G G K
- - - - K M S K S - - - - - - - - - - - - - - -
------------GTAACGGTTGCCGAC---------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D Q K Q E P P Y G A D V L R L W V S S V D Y S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D V P I G K N I L K Q M A D V Y R K I R N T A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F L L G N L H D F D P A K D A L P W E K L P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D R Y L L H R L R E V I L E I Q D A F E S F Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
F R F F Q T V Q N F C V V D L S N F Y L D I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D R L Y I S A P D S L R R R S C Q T V L A I C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E A L A T A I A P V L S H M A E D I W Q S L P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P A R T K S V F Q A G W V Q L Q D D W N Q P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A A K W Q Q L R D L R S E V N K V L E Q A R R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Q A I G S S L E A K L Q L W V A D S D W R A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A D R N P A D S L S G T A V D D L R Y L F L V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
Q V E L R D Q P T G L T E A K Y H A Q T E D W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
I A V V D A E G Q K C D R C W N Y S T T V G Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954
S E H P D L C D R C V S A L Q G T F
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_ile_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K K F A E Y S Q F D L S K V N K D V L K K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D E N Q V F A K S M T E R E G C P S F V F F E G
- - - - - - - - - - - - - - - - - - - V F F E .
---------------------------------------------------------GTATTTTTTGAA---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P S A N G M P G I H H V M A R S I K D I F C R
P P S A N G M P G I H H V M A R S I K D I F C R
CCTCCATCAGCTAACGGTATGCCGGGTATTCACCACGTAATGGCTCGTTCTATCAAAGATATTTTCTGTCGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y K T M K G Y Q V K R K A G W D T H G L P V E L
Y - - - - - - - - K R K A G W D T H G - - - - -
TAC------------------------AAACGTAAAGCCGGTTGGGACACACACGGA---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G V E K S L G I T K E D I G K T I S V A E Y N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
H C R Q D V M K F T K E W E D L T H K M G Y W V
- - - - - - M K F T K E W E D L T H K M . . . .
------------------ATGAAGTTTACAAAGGAATGGGAAGACCTGACCCACAAAATG------------
145146147148149150151152153154155156157158159160161162163164165166167168
D M K H P Y I T Y D N R Y I E T L W W L L K Q L
D - - H P Y I T Y D - - - - - - - - - - - - - -
GAT------CATCCATACATTACATATGAT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y K K G L L Y K G Y T I Q P Y S P A A G T G L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S H E L N Q P G C Y R D V K D T T V V A Q F K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K N P K P E M A Q W G T P Y F L A W T T T P W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L P S N T A L C V G P K I D Y V A V Q S Y N A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T G Q P I T V V L A K A L L N A H F N P K A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L K L E D Y K A G D K L V P F K V I A E Y K G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D L V G M E Y E Q L I P W V N P G E G A F R V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G D Y V T T E D G T G I V H I A P T F G A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A Q V A K A A G I P P L Q L V N K K G E L R P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V D L T G K F Y T L D E L D E D F I K Q R V N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D L Y K E Y A G R F V K N A Y D P N L S D Q D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S L D V S I C M M M K V N N Q A F K I E K H V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N Y P H C W R T D K P V L Y Y P L D S W F I R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T A C K E R M I E L N K T I N W K P E S T G T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R F G K W L E N L N D W N L S R S R Y W G T P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P I W R T E D N S D E K C I E S V E E L Y N E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E K S V A A G Y M Q S N P Y K D K G F V P G E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N E E N Y N K I D L H R P Y V D D I I L V S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G K P M K R E A D L I D V W F D S G A M P Y A Q
- - - - - - - - - - - D V W F D S G A M P Y - -
---------------------------------GACGTATGGTTTGATTCGGGCGCAATGCCGTAT------
625626627628629630631632633634635636637638639640641642643644645646647648
I H Y P F E N K E L L D S H Q V Y P A D F I A E
- - - - - - - - - - - - - - - - - - - - F I A E
------------------------------------------------------------TTTATAGCGGAA
649650651652653654655656657658659660661662663664665666667668669670671672
G V D Q T R G W F F T L H A I A T M V F D S V S
G V D Q T R G . F F T L H A I A T M V - - - - -
GGAGTAGACCAAACTCGCGGA---TTCTTTACTTTACATGCCATTGCAACAATGGTA---------------
673674675676677678679680681682683684685686687688689690691692693694695696
Y K A V I S N G L V L D K N G N K M S K R L G N
Y . A V I S N - - - - - - - - - K M S K R - - -
TAT---GCTGTTATTTCCAAT---------------------------AAGATGTCTAAACGT---------
697698699700701702703704705706707708709710711712713714715716717718719720
A V D P F S T I E Q Y G S D P L R W Y M I T N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S P W D N L K F D V D G I E E V R R K F F G T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y N T Y S F F A L Y A N V D G F E Y K E A D L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
M N E R P E I D R W I L S V L N T L V K E V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
C Y N E Y E P T K A G R L I S D F V N D N L S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
W Y V R L N R K R F W G G G F T Q D K L S A Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T L Y T C L E T V A K L M A P I A P F Y A D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Y S D L I G V T G R D N V V S V H L A K F P E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
N E K M V D K E L E A Q M Q M A Q D V T S M V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A L R R K V N I K V R Q P L Q C I M I P V V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
V Q K A H I E A V K A L I M S E V N V K E I K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
V D G A A G V L V K K V K C D F K K L G P K F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
K Q M K A V A A A V A E M S Q E A I A E L E K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
G K Y T F D L G G A E A V I E S A D V E I F S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
D I P G W L V A N E G K L T V A L E V T V T D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
L R R E G I A R E L V N R I Q N I R K S S G F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
I T D K I K L T L S K N P Q T D D A V N E Y N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
Y I C N Q V L G T S L T L A D E V K D G T E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610971098109911001101110211031104110511061107110811091110111111121113111
F D D F S L F V N V V K E
- - - - - - - - - - - - -
---------------------------------------
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_ile_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D Y K E T L L M P Q T E F P M R G N L P K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P E M Q K K W E E M D I Y R K V Q E R T K G R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F V L H D G P P Y A N G D I H M G H A L N K I
- - V L H D . P P Y A N G D I H M G H A L N K I
------CCGCTCGGCTTC---CGGCGCGGCGTCATACGGCTCATCGGCGATCGAAAAGGCGGAAACGATGAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K D I I V R Y K S M S G Y C A P Y V P G W D T
L K D I I V R Y - - - - - - - - P Y V P G W D T
AAGCTGGCGCAAGTCGGCATCAAG------------------------GTCTTTCGGGTAGACGATGACGCT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H G L P I E T A L A K Q G V D R K S M S V A E F
H G - - - - - - - - - - - - - - - - - - - - - -
CGCGGT------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R K L C E Q Y A Y E Q I D N Q R R Q F K R L G V
- - - - - - - - Y E Q I D N Q R R Q F K R L . .
------------------------AAGCAGCTCTTCTTCGCCGTCGATCGCGATCGGCTCCGGCAT------
145146147148149150151152153154155156157158159160161162163164165166167168
R G D W D N P Y I T L K P E Y E A Q Q I K V F G
. . D - - N P Y I T L K - - - - - - - - - - - -
------GAC------GACGTTTTCTCTTCGATTCGG------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E M A K K G L I Y K G L K P V Y W S P S S E S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L A E A E I E Y K D K R S P S I Y V A F P V K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G K G V L E G D E R I V I W T T T P W T I P A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L A I A V H P E L D Y H V V E T N G Q K Y V V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A A L V E S V A N E V G W D A W S V V K T V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N E L E Y V V A K H P F Y E R D S L V V C G E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V T T D A G T G C V H T A P G H G E D D F L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q K Y G L P V L C P V D E R G Y M T S E A P G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G M F Y E D A N K A I T Q K L E E A G A L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L G F I T H S Y P H D W R T K Q P T I F R A T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q W F A S I D K I R S E L L Q A I K D T K W I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E W G E I R I H N M V R D R G D W C I S R Q R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W G V P I P V F Y G E N G E P I I T D E T I E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V S N L F R Q Y G S N V W F E R E A K D L L P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G F T H P S S P N G I F T K E T D I M D V W F D
- - - - - - - - - - - - - - - - - - - D V W F D
---------------------------------------------------------CGTTGGCTGCTTCGT
529530531532533534535536537538539540541542543544545546547548549550551552
S G S S H Q A V L V E R D D L A R P A D L Y L E
S G S S H Q - - - - - - - - - - - - - - L Y L E
CCGCCAGTCGTGCGGATA------------------------------------------CTCAAGCTTCTG
553554555556557558559560561562563564565566567568569570571572573574575576
G S D Q Y R G W F N S S L S T A V A V T G K A P
G S D Q Y R G . F N S S L S T A V A V - - - - -
TGTAATCGCCTTGTTGGCGTC---GTAAAACATTCCTTCAAACCCCGGCGCTTCGCT---------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y K G V L S H G F V L D G E G R K M S K S L G N
Y . G V L S H - - - - - - - - - K M S K S - - -
CTC---GACCGGGCAAAGAAC---------------------------AAAGTCGTCTTCCCC---------
601602603604605606607608609610611612613614615616617618619620621622623624
V V V P A K V M E Q L G A D I L R L W V A S V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y Q A D V R I S D N I L K Q V S E V Y R K I R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T F R F M L G N L F D F D P N Q N A V P I G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G E V D R Y M L A K L N K L I A K V K K A Y D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y D F A A V Y H E M N H F C T V E L S A F Y L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
M A K D I L Y I E A A D S R A R R A V Q T V L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E T V V A L A K L I A P I L P H T A D E V W E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I P N R R E N V E S V Q L T D M P E P I A I D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E E E L L S K W D A F M D V R D D I F K A L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A R N E K V I G K S L T A S V I V Y P K D E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K L L A S L D A D L R Q L L I V S A F S I A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P Y D A A P A E A E R L D H V A V L V R P A E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
E T C E R C W T V T K E V G A D P S H P T L C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924
R C A H I V N E H Y S A
- - - - - - - - - - - -
------------------------------------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_ile_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A F A A V D P K V S F P T L E D E I A A W W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A H G I V K K T L D H G D A S R P F V F F E G P
- - - - - - - - - - - - - - - - - - V F F E . P
------------------------------------------------------GGCATATTCAGC---GAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P T A N G R P G I H H V E A R S S K D I M V R F
P T A N G R P G I H H V E A R S S K D I M V R F
TGCCGCCAAATCAACCTCGGTTCCCAAGGTTGCATTGATACGATCGGTGATCGCTAGATCAGCGGCCTTACG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N R M L G K K V I G A R G G W D T H G L P V E L
- - - - - - - - - G A R G G W D T H G - - - - -
---------------------------GCGGGCGATGCCTTCGCGCAGCAATTCATC---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E V E K K L G F A G K P D I E K Y G I T E F N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A C R Q S V W D Y I Q E W E K L T Q R I A F W I
- - - - - - W D Y I Q E W E K L T Q R I . . . .
------------------TGTTTCGCCTTCGACTACAACCTCGAAGCTGGCCCCGGTTTC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D L E D P Y I T Y D N K Y I E S L W W I F K Q L
D - - D P Y I T Y D - - - - - - - - - - - - - -
TGC------GGCTTGCTCGCTGCTAAGATT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H E R E L L Y R D Y K V T M H C P R C G T S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D H E V A Q G Y Q D N T D D P S V W V R F R H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P S D H A L D A Q V A D A A F L A W T T T P W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L P A N A G L A V N P E A T Y V L A E H E G Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y I L A E A L V G A V L G E T A A T L A S F V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A D L R G L R Y T P L F P G V G D N G A A I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S S A Y R V V A D E F V S L E D G T G I V H I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P A Y G D L E I G R K Y G L P T L F S V E L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K V L G S F E S F G F A G M F F K E A D P K I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R Y L K E Q G L L F K S G R V L H T Y P F C W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C K T P L L F Y A K Q S W Y I R T T A L K Q Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I A N N K K I N W V P E H I Q A G R F G N W L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N N I D W A I S R E R Y W G T P L P V W T C D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C Q H I D V V G S L A E L G E R W G Q D T A N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D M H R P F V D A P S W S C P E C E A G T M Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I P D V A D C W F D S G A M P V A Q W H Y P F E
- - - - - D C W F D S G A M P V - - - - - - - -
---------------AATGCGCTGCATCGTGCCAGCTTCGCACTCAGG------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N Q E L F E V A G Q A D F I S E A I D Q T R G W
- - - - - - - - - - - - F I S E A I D Q T R G .
------------------------------------ACCCCAACGTTCGCCAAGCTCCGCCAACGAACC---
577578579580581582583584585586587588589590591592593594595596597598599600
F Y T L H A V S T L L F D R P A Y K N V I C L G
F Y T L H A V S T L L - - - - - Y . N V I C L -
CACATCGATATGCTGACAGGTATCGCATGTCCA---------------GCC---ATAGCGCTCACGGCT---
601602603604605606607608609610611612613614615616617618619620621622623624
H L L D G K G E K M S K S K G N I V S P W E M V
- - - - - - - - K M S K S - - - - - - - - - - -
------------------------CCAGTTGCCAAAACG---------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E K Y G A D A V R W Y M F A A G Q P Y N P R R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S A D L V S E S L R Q F L L T L W N T Y S F F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T Y A N V D G W T P E L A Q G D L A A I D R W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L A R L N A L V R D V R N D L S N Y D M N T P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K R L E Q F V D E L S N W Y V R R N R R R F W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S D M N G D K Q A A Y S T L Y T C L V T I S K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
M A P F T P F V A E S L Y Q N L V R S Y D Q T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A E S V H M A L Y P E A N L A L I D E E L I R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
T D L L L K A V S L G R A A R K N A G I R V R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
P L S E V L V R L P R G E Q L D E L S A E L S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E L N I K S V R W L G V G D G L V S Y R F K P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L R S V G K K F G K L V P A L R E V L A N L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E Q A A D A A H K V E T G A S F E V V V E G E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
L T L A A D D V L M E A S S P E G Y A V A E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
G L L V A L V T T L T D E L L R E G I A R E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
R N L N D A R K A A D L A I T D R I N A T L G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
E V D L A A V V A E Y A E Y I K A E T L C E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
S V G D A N A D H H T S S M E L E Q G K L S L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
I S K I G
- - - - -
---------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_ile_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E Y K N T L N L P K T S F P M K A N L V N K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K V F L E E W E K M D L Y N Y V L E Q R K G K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F V L H D G P P Y A N G H I H I G T A L N K I
- - V L H D . P P Y A N G H I H I G T A L N K I
------GTCCTGCACGAT---CCCCCTTACGCAAACGGTCACATCCACATTGGAACGGCCCTGAACAAGATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K D I V V K Y K T M R G Y R A P Y V P G W D T
L K D I V V K Y - - - - - - - - P Y V P G W D T
CTGAAGGACATCGTCGTCAAATAC------------------------CCGTACGTTCCTGGCTGGGACACC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H G L P I E H R V S Q E L G E K I K E M S P A E
H G - - - - - - - - - - - - - - - - - - - - - -
CACGGT------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I R K K C E E F A L R F V D I Q R E E F K R L G
- - - - - - - - - L R F V D I Q R E E F K R L .
---------------------------CTCAGATTCGTTGATATACAGAGAGAAGAATTTAAAAGACTC---
145146147148149150151152153154155156157158159160161162163164165166167168
V R G D W E N P Y I T L K P D Y E V K I L D V F
. . . D - - N P Y I T L K - - - - - - - - - - -
---------GAC------AATCCATACATCACGTTGAAG---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K T L V E Q G N V Y R S L K P I Y W C P R C R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L A E A E I E Y H D H K S P S I Y V K F R S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E D P N F F I V I W T T T P W T L P A N V G I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L H P D Y E Y S V V K V G E E K W V I A T D L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D A F S K E T G I D C S N V V E K I K G K D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G K E F V H P I F D D R T S R V I L A D Y V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E T G T G C V H I A P G H G E E D Y I Y G H V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y G L P I V S P V D E E G R F T E E A G K Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
M F I E D A N E V I I E D L K R K G I L V H A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S I T H S Y P H C W R C K G P V I F R A T E Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F I S V D H N N L R Q K V L E E I D K V K W I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E W G R N R I R S M V E E R P D W C I S R Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W G T P I P A V K C K E C G E V V L D P K V I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
H F M K I V E K E G T N A W F E K E V E E L I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E D F V C P K C G K R S F E K M L D T L D V W I
- - - - - - - - - - - - - - - - - - - - D V W I
------------------------------------------------------------GACGTATGGATA
529530531532533534535536537538539540541542543544545546547548549550551552
D S G A S F E Y I T T K R E D H P F P L D M Y L
D S G A S F E - - - - - - - - - - - - - - M Y L
GATTCTGGTGCCTCCTTCGAA------------------------------------------ATGTACCTT
553554555556557558559560561562563564565566567568569570571572573574575576
E G S D Q H R G W F H S S I F L A V A K R G S A
E G S D Q H R G . F H S S I F L A V A K - - - -
GAAGGTAGCGATCAGCACAGGGGA---TTCCATTCTTCCATCTTCCTTGCCGTCGCAAAG------------
577578579580581582583584585586587588589590591592593594595596597598599600
P Y K E V L T H G F I K D E Q G R K M S K S L G
- Y . E V L T H - - - - - - - - - K M S K S - -
---TAC---GAAGTGCTAACACAC---------------------------AAGATGAGCAAGTCC------
601602603604605606607608609610611612613614615616617618619620621622623624
N V V D P M E V V E K Y G A E I L R L W L A S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D Y F N D I K I S M R I V E Q Q T E V Y R K I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N T F R F L L G N L E D F D P E L D R V P H E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L L T I D R W A L G R L Q E I I K R A T E Y Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S Y E F S K V Y N L V V K Y C T T E L S S L Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D V V K D R L Y V E A K D S I Y R R S A Q T V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
H E I L I S L M K I L A P I M T F T M E E V Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H L H E K D R K Y K T V Q A E Y W P E Y R E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I D R K L M E D F E K L L S I R E D V L K A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E K R Q Q D V I G H S L D A E V V L V P K N D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I K A L L E K Y R D I L E E L F I V S K V S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
D A S G E L K G E L V E V T V K H A E G E K C Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
R C W K Y T T E I S A S E D F P G V C P R C L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919
V L K G E R K
- - - - - - -
---------------------
Class I
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_ile_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E E K K V D L K D T L N L P R T E F P M K A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L P Q R E P Q I L E K W K G L Y E K I Q K E R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G R E V F V L H D G P P Y A N G H I H V G H A L
- - - - - V L H D . P P Y A N G H I H V G H A L
---------------TCCTTCTATCTG---TTCTCCTCCCTCTCTCAGCTCAACCTGACTGACCGTAAAGAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N K I L K D V I N K Y N L L I G K N V N F I P G
N K I L K D V I N K Y - - - - - - - - N F I P G
GAAGTTCAGGTAATCCTCGTACTTTTTAAGGAG------------------------TATGTAAACCTTTGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W D C H G L P I E R A V E K E L S K K K I K K E
W D C H G - - - - - - - - - - - - - - - - - - -
TTCGTAAGGGTGCTT---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S L P K T E F R E L C R E Y A K K Y V N I Q R E
- - - - - - - - - - - - - - - K K Y V N I Q R E
---------------------------------------------ATTCTCATCGGGCTTTGGCATTTCGTA
145146147148149150151152153154155156157158159160161162163164165166167168
D F V R L G V L G D W E H P Y L T M D P K Y E A
D F V R L . . . . D - - H P Y L T M D - - - - -
GAGGAATACGCTCTC------------GTC------CCCTACGTGCTCCCATAGCTC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q E I R E L G K F F E R G L A Y R S K K P V Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C I Y D K T A E A E A E V E Y Y E K E D P S I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K F P L K S G E K F G I K D K K V F A I I W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T T P W T L P A N L G I M V K E D A D Y V L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V E D E V W I V A K E L M D K F F E T V N R P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L V L E T V K G K D L V G L E Y T H P F V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K L K G H L S E E T L K N M W K I Y P S E F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S L D T G T G L V H M A P G H G Q E D Y V V G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R Y G L E P Y A P V S D E G R F V E P A P E F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I N V R V F D A N H L I V G V L K E K G F L V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E K I R H S Y P H C W R C K N P V I F R A T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q W F I G M D I E F F G K T L R Q R A L E E I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K V K W I P E Y G K N R I K S M V E N R P D W C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I S R Q R F W G V P I T V F Y C E N C G E I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R E V F E R V A Q L V E N S E K G S D V W F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L T S S Q L L P E G Y K C P K C G G D S F T K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E D I L D V W F D S G C S H A A V I R P L G F Q
- - - - D V W F D S G C S H A - - - - - - - - -
------------TTTCAGAACTCCTACGATTAAGTGGTTTGCGTC---------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K A D L Y L E G S D Q H R G W F Q A S L L E S V
- - - L Y L E G S D Q H R G . F Q A S L L E S V
---------TTCTACAAACCTCCCCTCGTCGCTGACGGGTGC---GGGCTCAAGTCCGTACCTCTGACCGAC
601602603604605606607608609610611612613614615616617618619620621622623624
G S Y L E A P Y K A V L T H G F I V D E K G R K
G S - - - - - Y . A V L T H - - - - - - - - - K
TACGTA---------------TCC---AGCCATGTGAACGAG---------------------------TTC
625626627628629630631632633634635636637638639640641642643644645646647648
M S K S L G N V I S P Q E V V K E F G A D I L R
M S K S - - - - - - - - - - - - - - - - - - - -
CGAGGGGTATAT------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L W V V S E D Y T E D V K L G K N L L K K I A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D Y R K I R N T L R F I I G N L Y D F N P R T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A L P F E K L H H F D R W I I S E L Q N L L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V H E N Y E K F L F Y R V H N H I K N F V I T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L S A I Y L D V L K D R L Y V Y A P A S W E R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S A Q T A L W H L L I A L T T S T A P Y L S F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A E E L W E H V G K L D P S L P E S V F L Y E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P K P D E N L K D E E V L K D Y E I L L K V R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E V M R A L E V A R K E K G I I K H P Y E A K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Y I R G D E S V E S L L K K Y E D Y L N F F F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V S Q V E L R E G G E V Q I E G E E L P V K V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V N K A E G E K C P R C W I Y Y Q K E E F V G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956
V C K R C A K A L S E M G I E L N A V C
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_ile_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K N K Y K E T L N I P Q D V L P M R A N L I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K E L K F K T F W D Q N K I Y Q K A L E K N K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N K P F I L H D G P P Y A N G D L H I G H A L N
- - - - I L H D . P P Y A N G D L H I G H A L N
------------TAATGTTTTTAA---TTCATCAGTTTCTTTTATGTAAACTAATGCTTGATTTGCGCTTTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I L K D I V V R Y K S L S G F Y A P F V P G W
K I L K D I V V R Y - - - - - - - - P F V P G W
AATAAGTTTGTCTTTAATTGCTATTTCAAT------------------------TTCAAAAAAGGAATTTCA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D T H G L P I E N K I L K E L K I D D H K N I S
D T H G - - - - - - - - - - - - - - - - - - - -
CTTTTCTTCTTG------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T L E L R K Q A R E Y A L S Q I K N Q K K Q F L
- - - - - - - - - - - - L S Q I K N Q K K Q F L
------------------------------------AGTTGGTAAAATTGGAGCTAAAATTAATAATAAAGT
145146147148149150151152153154155156157158159160161162163164165166167168
T M Q L F S D F K D Y Y Q T L D P K F E A E Q L
T M . . . . D - - D Y Y Q T L D - - - - - - - -
TTTTGT------------ATT------AATCATTTTTCTTTGTAAATC------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K V F K K M A L D G L I Y K S L Q P V F W S P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S Q S A L A E A E V E Y H E H K S H S I Y T A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K I V K G N K F V E K N D F L V I W T T T P W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L I A N S G V S V K E E F S Y S K I N Y E N K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y I F A T D L V Q K V T E I F G W K N F K I I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S F Q G K D L V G I E Y Q R P I K Q E K T A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L G H H V T L E S G S G L V H M A P L F G L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D F I I G R V E K L E E I M H I N D D G S I N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F G N Q F A N K F Y W D A N P E I N E F L K Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N L L L H H S F L Y H S Y P H D W R T N K P V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y R G S N Q W F V S I D P I K E K I T K S I E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V E S Y P T W G I S R L K T M I D N R T S W T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S R Q R A W G V P I P I F Y N E K N E P V F E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L F D H I I D L V S K Y G T D I W F E K S T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L L P E K Y K N K N W T K E K D I M D V W F D
- - - - - - - - - - - - - - - - - - - D V W F D
---------------------------------------------------------ATTGCCAAATTCATT
529530531532533534535536537538539540541542543544545546547548549550551552
S G T T S M G V K I E G A P V P W D V Y L E G S
S G T T S M - - - - - - - - - - - - V Y L E G S
AATACTTCCATCATCATT------------------------------------AATGATAAAATCATCCAA
553554555556557558559560561562563564565566567568569570571572573574575576
D Q Y R G W F N S S L I N S V V Y Y N Q A P F K
D Q Y R G . F N S S L I N S V V Y - - - - - F K
TCCAAAAAGAGGTGC---ATGAACTAGACCAGATCCTGATTCTAAAGTTAC---------------AATAGG
577578579580581582583584585586587588589590591592593594595596597598599600
K L V S H G F V L D E K G N K M S K S K G N V V
. L V S H - - - - - - - - - K M S K S - - - - -
---TGTTTTTTCTTG---------------------------TACTAAATCTTTACC---------------
601602603604605606607608609610611612613614615616617618619620621622623624
L P Q E I I S K F G A D I L R L W V A N S E Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S D V T I G E N I I N Q N V E I Y R K F R N T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R F L I A N L V D F D Y K K D L K E L T G I H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L I K E Q L E T L K F N T K I A Y E N F Q F T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V I K L T N N F V Y N L S S F Y L D F S K D I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y A N K I E D L Q R K M I Q T N F Y N I T K T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L L I L A P I L P T T I E E V Y Q I F D Q A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K E S V H L E N F F G I S S I E T I Q E E K W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S F F E L K N K V Y A L I E I A I K D K L I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A N Q A L V Y I K E T D E F L K T L D L K N L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
M V G K V I F S K E N K I E N Y E G H L C E R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885
R I Y F D F I D K D N L C V R C S K V I L
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_ile_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E L G S Y K D T V N L P K T K F D M R A N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T K R E P E I Q K F W A E N Q I Y D R L S Q Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G E I F T L H D G P P Y A N G S L H I G H A L
- - - - - T L H D . P P Y A N G S L H I G H A L
---------------CAATTCTGTTAG---TGCGGGAGTATCGAGCAATTCTACCCCAGAAGTGATGAATAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N K I L K D I I N R Y Q L Q Q G R K V R C I H G
N K I L K D I I N R Y - - - - - - - - R C I H G
ATAGCGTAACTCATCAACACCGTTGGAATGAGT------------------------GTTTAAAAATTGCAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W D C H G L P I E L K V I Q S M K P Q E R A S L
W D C H G - - - - - - - - - - - - - - - - - - -
GCGTTGTCGCAAATT---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T P L E L R H K A R D F A L K A M Q E Q C A S L
- - - - - - - - - - - - - L K A M Q E Q C A S L
---------------------------------------GAGTTGGCGCAACTGAACCCAAGATTCTGCCAG
145146147148149150151152153154155156157158159160161162163164165166167168
K R W G V I G D W E N S Y L T L K P K Y E A A Q
K R W . . . . D - - N S Y L T L K - - - - - - -
CTCTGAATT------------CTC------CACCCAGCCGGATTCAAATAC---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I G V F G Q M V L K G Y V Y R G F K P V Y W S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S S K T A L A E A E L E Y P E G H T S R S L Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A F P M T H I E P S V F P K L K S F L P H L W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A I W T T T P W T I P A N L A V A V N P D L T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V V E M S R K D A E T Q S T L S A F A S L R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q N P Q Y L I V A A D L V E R L S V T L G A Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T V K A T F K G Y E L E H C K Y R H P L C D R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S P I V I G G D Y V T T E S G T G L V H T A P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H G Q E D Y Q V G M R Y N L P I L S P V D A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N F T A E A G Q F A K L N V L G E G N A A V V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L E Q A G S L L K E E P Y V H K Y P Y D W R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K K P V I L R A T E Q W F A S V E G F R D A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q E I A H V R W I P A Q G E N R I T A M V A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S D W C I S R Q R S W G V P I P V F Y D E E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E P L L N E E T I A R V Q N I F A E K G S D A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
W E M S V E E L L P E K Y R D N G R K Y R K G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D T M D V W F D S G S S W A A V L Q Q R P E L S
- - - D V W F D S G S S W A - - - - - - - - - -
---------GTGGACGTATGGTTCTTCCTTCAGCAGCGAACC------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y P A D L Y L E G S D Q H R G W F Q S S L L T S
- - - - L Y L E G S D Q H R G . F Q S S L L T S
------------TAATACGTTAAGCTTGGCAAATTGTCCGGCTTC---TGTAAAGTTACCATCGGCATCGAC
601602603604605606607608609610611612613614615616617618619620621622623624
V A T N G H A P Y K T V L T H G Y T V D E Q G R
V A T - - - - - Y . T V L T H - - - - - - - - -
GGGAGAGAG---------------GCG---CCCCACTTGATAATC---------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K M S K S L G N G V D P T V V I D G G K N Q K E
K M S K S - - - - - - - - - - - - - - - - - - -
GACGAGTCCCGTACC---------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E P P Y G A D V L R L W V S S V D Y S A D V P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S K N I L K Q L A D A R N K I R N T A R F L L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N L H D F D P S K D A V P Y E Q L P E L D R Y M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L H R M T E V F N E V T Q A F D K Y Q F F R F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Q T V Q N F C V V D L S S F Y L D I A K D R L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I S A A N S F R R R S C Q T V L Q I A L E N L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K A I A P V L C H M A E D I W Q Y L P Y P K S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E S V F E S G W V K L E D K W Q N S E L A E S W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V Q L R Q L R T E V N K V L E Q A R T E K A I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
S S L E A K V L L Y V A D A N L R Q R L Q F L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P S T D A Q P S T H S N G V D E L R Y L F I T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G V E L L D T P A T L T E L K Y N F Q S E A L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
I G V A K A D G K K C D R C W N Y S I H V G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978
Q A H P L L C E R C I P A L A G E F
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_ile_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K Y P E Y K Q L D L V Q V A Q E I N E F W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N H D I F L E S I K N R E G K P S F T F Y E G P
- - - - - - - - - - - - - - - - - - T F Y E . P
------------------------------------------------------CGTTTGGTATAC---AAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P S A N G E P G I H H V L S R A L K D L F C R Y
P S A N G E P G I H H V L S R A L K D L F C R Y
TGCTTCTTTTACAAAGTCTTCTTGAGAAGCTATAGCGAGCTGTATCTTATCCTGTACTTCTAAGCCCATAGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K T L Q G Y Q V K R K S G W D T H G L P V E L Q
- - - - - - - - K R K S G W D T H G - - - - - -
------------------------TATTACGTCTCTGGCAACACCTTCTTGTCG------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E K S L G I T K E E I G K R I S I E E Y N A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
C R Q T V M R Y T D Q W E K L T T E L G Y W L D
- - - - - M R Y T D Q W E K L T T E L . . . . D
---------------AAGTCTGATCATATCTTTACCTATATTGAGCATTAATTCTTG------------TAA
145146147148149150151152153154155156157158159160161162163164165166167168
T E N P Y I T Y D R Q Y I E S V W Y L L K Q L Y
- - N P Y I T Y D - - - - - - - - - - - - - - -
------ATCTTCTTGAGTAAGCGTAGT---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S K G L L Y K G Y S I Q P Y S P A A G T G L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H E L N Q P G C Y R S V K D V T V V A Q F K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N A E Q D Y V L A W T T T P W T L P A N S A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I G E N I T Y V K V R T Y N P Y T H Q L V Q V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L A E A A L A R Y F T T S P D R E A V A H Y Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G A S T I P W E I I A K Y Q G K D L V G L E Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q L L P Y V Q P V N H T F R I V S G D F V T T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E G T G I V H I A P T F G A D D M R L A Q K S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I P A I T V E R D G K A V P I V D K Q G R F V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I T D W A G K Y V K E D Y E P E N I R N Q P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y K S A D V L I A I K L K Q E N K A F L V A K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E H N Y P H C W R T D K P I L Y Y P L D A W F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R T T A Y K D R L I A L N K T I N W K P A S T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T G R F E N W L E N L V D W N L S R D R F W G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P L P I W R T E D G Q E E L C I G S I Q E L N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E V E K S I A A G F M E H P L P I D F D L H R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y V D N I V L A S P S G K E M H R T T D L I D V
- - - - - - - - - - - - - - - - - - - - - - D V
------------------------------------------------------------------TGCTAT
577578579580581582583584585586587588589590591592593594595596597598599600
W F D S G A M P Y A Q W H Y P F E N K E T F Q Q
W F D S G A M P Y - - - - - - - - - - - - - - -
GGATTTTTCTACTTCTTGGTTGAGTTC---------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S F P A D F I A E G V D Q T R G W F F T L H A I
- - - - - F I A E G V D Q T R G . F F T L H A I
---------------AGTACCCCAAAATCGATCACGACTCAAATTCCA---CACTAGATTTTCTAGCCAGTT
625626627628629630631632633634635636637638639640641642643644645646647648
A V M L F D S V A F K N V V S N G L I L D K I G
A V M L - - - - - F . N V V S N - - - - - - - -
TTCAAAGCGGCC---------------GGG---CCAATTGATTGTTTT------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N K M S K R L G N S I D P F Q I M Q Q H G P D A
- K M S K R - - - - - - - - - - - - - - - - - -
---AGCTGTAGTACGGAT------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L R W Y M I S N A N P W D N L K F D T E G L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V T R K F F S T L Q N T Y S F F A L Y A N L D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
F F F N K Q S N I P L K G R P E I D R W I L S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L H S L I Q F V T T E L D A Y E P T R A C R A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Q D F V V D D L S N W Y V R L N R K R F W K S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
Q T Q D K T A A Y Q T L Y T C L T T V V Q L A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P I A P F Y T E R M Y K D L Q L V Q Q E D K T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S I H L S D W P V V N T S A I N L A L E A K M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Q A Q T I V S L V H S L R K K H N L K V R Q P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
T K L I V P V T N E A M Q A Q I E A V A D L I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A E T N I K Q I T Y I A H T S E L V A K K V K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
N F K Q L G Q R Y K A Q I K P I T E A L T T L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
Q E D I L L L E A H Q E L M L N I G K D M I R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
S L E D V M I I S E D I P G W S V A S Q E S I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
V A L D I T V T D A L R Q E G V A R D V I N R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
Q N M R K S M G L E V Q D K I Q L A I A S Q E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
F V K E A V T V Y Q T Y I C Q E T Q A L Q F T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
L E S L T K G E Q V E I D N Y V L Q I N V K L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
T A G Q
- - - -
------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_ile_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D Y K D T L L M P K T D F P M R G N L P N R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P E I Q G K W E D M D I Y S L V Q K R T E G R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M F V L H D G P P Y A N G D I H M G H A L N K V
- - V L H D . P P Y A N G D I H M G H A L N K V
------GTGCTTCATGAC---CCGCCGTATGCGAACGGCGATATTCATATGGGGCATGCGCTTAACAAAGTA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K D F I V R S R S M S G Y H A P Y V P G W D T
L K D F I V R S - - - - - - - - P Y V P G W D T
CTGAAGGATTTCATCGTCCGTTCG------------------------CCGTACGTTCCGGGCTGGGACACA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H G L P I E T A L T K N K K V K R K E M T V A E
H G - - - - - - - - - - - - - - - - - - - - - -
CACGGC------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F R K L C E E Y A W Q Q I E G Q K T Q F K R L G
- - - - - - - - - W Q Q I E G Q K T Q F K R L .
---------------------------TGGCAGCAAATCGAAGGCCAAAAAGCGCAATTTAAGCGGCTC---
145146147148149150151152153154155156157158159160161162163164165166167168
V R G D W E N P Y V T L K P E F E A Q Q I K V F
. . . D - - N P Y V T L K - - - - - - - - - - -
---------GAT------AATCCATACGTGACGCTTAAG---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E M A K K G Y I Y K G K K P V Y W S P S S E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L A E A E I E Y H D K R S P S I Y V A F D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D G K G V L T N G E K I V I W T T T P W T I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N L G I A V H P E L E Y S V V A A G G A R Y V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A S A L I E S V A K A I G F E D H E V V Q T V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G K D L E H I V A V H P L Y G R D S L V M L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H V T T D A G T G C V H T A P G H G E D D F I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G Q K Y G L D V L C P V D E K G H M T S E A P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F E G L F Y D Q A N K P I T E Q L E E K G A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K L D F I T H S Y P H D W R T K K P T I F R A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S Q W F A S I K D F R D E L L D A V K E T K W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P E W G E T R L Y N M I R D R G D W C I S R Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A W G V P I P V F Y A E N G E P I I T D E T I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
H V S E L F R E H G S N I W F E K E A N E L L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E G F T H P G S P N G K F T K E Q D I M D V W F
- - - - - - - - - - - - - - - - - - - - D V W F
------------------------------------------------------------GACGTCTGGTTT
529530531532533534535536537538539540541542543544545546547548549550551552
D S G S S H Q A V L E E R D D L V R P A D L Y L
D S G S S H Q - - - - - - - - - - - - - - L Y L
GATTCAGGTTCGTCTCATCAG------------------------------------------TTGTATCTG
553554555556557558559560561562563564565566567568569570571572573574575576
E G S D Q Y R G W F N S S I S T A V A V T G K A
E G S D Q Y R G . F N S S I S T A V A V - - - -
GAAGGATCTGACCAATACCGCGGC---TTTAACTCATCGATTTCGACAGCGGTTGCCGTA------------
577578579580581582583584585586587588589590591592593594595596597598599600
P Y K G V L S H G F A L D G E G R K M S K S L G
- Y . G V L S H - - - - - - - - - K M S K S - -
---TAT---GGCGTGCTTTCGCAC---------------------------AAAATGAGTAAATCA------
601602603604605606607608609610611612613614615616617618619620621622623624
N V V V P A K I M N Q F G A D I L R L W V A S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D Y Q A D V R V S D A I L K Q V A E V Y R K I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N T F R F L H G N I A D F D P A K D A I A V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L R E V D Q Y I L I K L N S L I E K V K K A Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E Y D F A V I Y H A V H N F C A I E L S S F Y M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D F A K D V V Y I E H A D H K D R R S M Q T V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y E T L L G L V K L I A P I L P H T A D E M W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H F T F V S E K S V Q L T D M P E T R D I P N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K E T E E K F D S F M K L R G D V L K A L E T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R N E K I I G K S S V A S L T L Y P N E E A K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L L S S I K E D V K Q L F I V S E L L I G G T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A E A P E G A Q T F D T G K I V V A Q A E G E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
C E R C R M V S K E I G Q D A D H P E L C P R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922
A G I V K T Y Y Q N
- - - - - - - - - -
------------------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_ile_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F K K V E N K A N F P K I E E K I L K F W N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N K I F E K S I K Q R E G C E E F T F Y D G P P
- - - - - - - - - - - - - - - - - T F Y D . P P
---------------------------------------------------TTTATTTAGCAT---TTTCAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F A T G L P H F G H F V P N T I K D I I P R Y Q
F A T G L P H F G H F V P N T I K D I I P R Y -
AGTTTCATTATTTTCTATGTATAAATTTATTCTATCGCTAACATCAAAATTTTTTTCTTTTCTTAAATT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T M Q G K Y V K R N F G W D T H G L P V E Y E V
- - - - - - - K R N F G W D T H G - - - - - - -
---------------------TGTCAGCCCTTCCAAGTACAACTCTTTAGT---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K K L G I S G K Y E I E N Y G I E N F N K E C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R K I V L R Y T E E W K N I I L R L G R W V D F
- - - - L R Y T E E W K N I I L R L . . . . D -
------------TGCATTGGCTACTTTTATCTCGTAGGATGTTCCATTTATTAT------------TTC---
145146147148149150151152153154155156157158159160161162163164165166167168
E K G Y K T M D I S F M E S V W W V F K N L Y E
- K G Y K T M D - - - - - - - - - - - - - - - -
---TAGCTTGCTAATTTCAGTAGA------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G L I Y E S Y Y V L P Y S P K L A T P L S N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V N L G E Y K E V N D P S L T I K F K I K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N E Y L L V W T T T P W T L P S N L G I A V G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E I E Y S K I F D K T K E E I L I L G S K K L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S Y Y D D E N S Y T I I E K F K G S K L E G I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y E P I F N Y F L E Q K D K G A F K V H T A D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V T T D D G T G I V H I A P F G E E D Y R I L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K H T N V D I I D P L D A E C K F T N Q V K D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K G L F V K D A D K K I I E N L K L R N F L F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R E N Y L H R Y P F C Y R T N C P I I Y R P I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S W F V N V E K I K T K L L E V N E K I N W M P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A H L K K G R F G K W L E N A K D W A I S R N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F W G N P I P I W I C S K T G K K I C I G S K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L E N L S G Q K I E D L H K D Q I D K I T W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S K D G G K F I R T S E V L D C W F E S G A M P
- - - - - - - - - - - - - - D C W F E S G A M P
------------------------------------------TCCAGATTCAAACCAACAATCGAGAACCTC
529530531532533534535536537538539540541542543544545546547548549550551552
Y A S N H Y P F T N E I N F K N I F P A D F I A
Y - - - - - - - - - - - - - - - - - - - - F I A
GCT------------------------------------------------------------ATGTAAGTC
553554555556557558559560561562563564565566567568569570571572573574575576
E G L D Q T R G W F Y T L T I L G T A L F E N T
E G L D Q T R G . F Y T L T I L G T A L - - - -
TTCGATTTTTTGGCCAGATAGGTT---AAGCTCTTTTTTTGATCCAATGCAAATTTTTTT------------
577578579580581582583584585586587588589590591592593594595596597598599600
A F K N V I V N G L V L S S D G R K M S K S F K
- F . N V I V N - - - - - - - - - K M S K S - -
---TAT---AATTGGAATTGGATT---------------------------CCAATCTTTTGCATT------
601602603604605606607608609610611612613614615616617618619620621622623624
N Y T D P M Q V I N T F G A D A L R L Y L I M S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P V V K A D D L K Y S D N G V R D V L K N I I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
P I W N A Y S F F T T Y A I I D K F K P P K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S L A K N N N L D K W I I S E L E S L K K I L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T E I D K Y N L T K S I E S L L E F I D K L N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
W Y I R R S R R R F W K S E N D K D K N D A Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T L Y Y A I K T L M I L L A P F I P F I T E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Y Q N L K T D E D K Q S I H L N D Y P K A N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F I N K T I E E K I N L A R K I T S M A R S L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S L H N I K I R M P I S T I Y I V T K N Q N E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
N M L M E M Q E I I L D E I N A K E M K I K A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E E E L I T Y K A K A N F K E L G K K L G K D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K A V S T E I S K L K N E D I I K I I N G T S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E I K V A N A K H Y L S L N D I I L E R E E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
N L K V I N E E S I T I G I D S L I T K E L Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E G L T R E F V R Q I Q N L R K E K N F D V S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
R I N L Y I E N N E T L K E M L N K F E K Y I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
T E T L A L N I I L N K S K L E K K I N L A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
I F T L I G I E K C
- - - - - - - - - -
------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_ile_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T K R T F A P V P T Q P N F R Q L E A D I L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K W K D E Q V F E Q T Q T R P A P A G E F V F Y
- - - - - - - - - - - - - - - - - - - - - V F Y
---------------------------------------------------------------GCCATCCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E G P P T A N G K P A L H H V L A R S F K D L F
E . P P T A N G K P A L H H V L A R S F K D L F
TTC---CGCGAGGGCAATCCGGTCCTGCACCTCGAAGCCCGCCGCCTTGCGGGCCTCCTGAATGGCGCGAAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P R F K V M Q G H H V T R K G G W D T H G L P V
P R F - - - - - - - - T R K G G W D T H G - - -
GAGATCACG------------------------AGGGGTCAGGGCGGTATCGAAGGCCACCAG---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E I S V E K K L G W L G R N H G A S R E E L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F N R L C R T S V W E T I Q D W N E L T E R M G
- - - - - - - - - W E T I Q D W N E L T E R M .
---------------------------CTGACCGGCCTGCACCGCCGTGGCGACGGCGCGGGCGTCCGC---
145146147148149150151152153154155156157158159160161162163164165166167168
Y W L D L G D P Y I T Y Q N S Y V E S V W N L L
. . . D - - D P Y I T Y Q - - - - - - - - - - -
---------CTT------CACCGGAAGCTGCTTGCCGTA---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R R L H E K G L V A Q D Y K V V P L S P R I S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T L S R A E L G E V D S Y R M V D D P S V Y V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L P I V W D T L P E R A H A A L S S L S G E Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q G L S L L V W T T T P W T L P S N T L A A V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P D L D Y V V A D S P S G R V I V A E G A V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L S A L H K D A A P L E V L A R F K G R D L E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V E Y E P P F P E V A S Q L G V V S E L H E R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D G K P V L H F V V M A D F V S D V D G S G V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H E A P A Y G A E D L E V A R A Y G V P L M F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V D D H G I L Q V T H E Q G K F F K D A D K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I A D M K A R G L M F W A G T L K H R Y P F H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R T G D P I L Y F A K K G W Y I R T S Q V A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M L A Q N E K I N W V P G N I K H G R F G N W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E G N V D W A I S R E R Y W G T P L P F W Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S G Q L R V I G S V A E L S E L A G R D L S D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D L H R P Y I D D I T F T L D G E E Y R R V P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V L D V W F D S G S M P Y A Q W G L L L N E Q G
- - D V W F D S G S M P Y - - - - - - - - - - -
------CAGGTCGCGCCCCGCCAGCTCGGAGAGTTCCGC---------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E A V R G A E Q F A K H Y P A D Y I C E A I D Q
- - - - - - - - - - - - - - - - Y I C E A I D Q
------------------------------------------------GGCCCAGTCCACGTTGCCCTCCAG
601602603604605606607608609610611612613614615616617618619620621622623624
T R G W F Y S L H A I S T M L Y D Q P A Y K N V
T R G . F Y S L H A I S T M L - - - - - Y . N V
CCAGTTGCC---GCGCCCGTGCTTGATGTTGCCCGGCACCCAGTT---------------CGC---CATCTC
625626627628629630631632633634635636637638639640641642643644645646647648
I C L G H I V D E K G L K M S K S K G N V V A P
I C L - - - - - - - - - K M S K S - - - - - - -
GCCCGCCAC---------------------------CTTGGCGAAGTAGAG---------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L P L F D Q Y G A D S V R W Y M F M A S D P G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Q K R F S E R L V A E A Q R S Y V N T L W N V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S F F V L Y A N L D Q P D L A A A P A V A E R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E M D R W L L A R L E E T V R D V T A A L E S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D A R S G G R A L E G F V D D L S N W Y V R R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R S R F W G E G G T V D T A A Y A T L H E A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V V S Q L T A P F T P F L A D A L Y R N L S G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E S S V H L T P W P T V R A E R L D R K L T A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
M A A V M K V V E L G R A V R G A H N L K T R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P L A G V Q V R A A S P E A L D A L K R S Q T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I M E E L N V K A V T F L E G D T D L V Q Y S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
R P N L P V V G K Q Y G K Q L P V L K K A L T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
A D A R A V A T A V Q A G Q G F S V Q A D G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
F D L T P G S V L V D A K A P E G V A A A E D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
G Y L V A F D T A L T P E L V R E G L A R D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
R A I Q E A R K A A G F E V Q D R I A L A L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
D G E A L E A A Q A W Q D F I A G E V L A E Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
A Y G S G E G F R A E V E G G A V T L K K L
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_ile_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H E K L I S G S S W I F H S A G P Y K D T V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L P I T K F N M R A N S T Q R E P E L Q K F W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K N G I Y E Q L L K S N P G E V F T L H D G P P
- - - - - - - - - - - - - - - - - T L H D . P P
---------------------------------------------------ACCTTACACGAT---CCTCCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y A N G D T H L G H A L N K I L K S I I V N Y Q
Y A N G D T H L G H A L N K I L K S I I V N Y -
TATGCAAATGGGGACACACACTTGGGGCATGCGCTGAACAAGATCTTAAAATCCATCATTGTCAACTAC---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L L G G K K A R Y V P G W D C H G L P I E L K V
- - - - - - - R Y V P G W D C H G - - - - - - -
---------------------AGATATGTGCCTGGCTGGGACTGCCATGGC---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L Q S M S D E Q R R E L D P I K L R R K A R D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L K T V K A Q R E Q F K R Y G I W G D W D A P
- L K T V K A Q R E Q F K R Y . . . . D - - A P
---CTGAAGACCGTCAAAGCGCAGCGCGAGCAGTTCAAGCGGTAC------------GAC------GCCCCC
169170171172173174175176177178179180181182183184185186187188189190191192
Y L T L E P K Y E A A Q L R V F G K L V A A G H
Y L T L E - - - - - - - - - - - - - - - - - - -
TACCTGACGCTGGAG---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I Y R G R K P V H W S P S S A T A L A E A E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y P E G H T S R S I Y V A M P L T S L G D A M P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E D L K E K L S G A A V A I W T T T G W T I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N E A V A V N E R M N Y G A E S W A H R R L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A E E L V D S L G A K F G V Q L Q R L G S L T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G Q L A G C Q Y R H P L F E R T S P V L I G G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y I T T E S G T G L V H T A P G H G Q E D Y Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G L K N G L P I S S P V D D D G V F T E E A G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F K G L P V L K E G T A A V I E A L Q Q K G C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L K E E R Y A H K Y P Y D W R T K L P T I F R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T D Q W F V S V E G F Q A A A M D A V R S V Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I P A S G E K R I T S M V E G R S D W C I S R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R S W G V P I P V L Y Y T D S G E P L M T E E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I E H M A A V V E A K G T D A F W Q L P I E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L P E R L R T E A P K L R K Q L E T M D V W F D
- - - - - - - - - - - - - - - - - - - D V W F D
---------------------------------------------------------GACGTGTGGTTTGAC
553554555556557558559560561562563564565566567568569570571572573574575576
S G T S W A G C V E S T P G L A F P A D L Y L E
S G T S W A - - - - - - - - - - - - - - L Y L E
AGCGGCACCAGCTGGGCC------------------------------------------CTCTACCTGGAG
577578579580581582583584585586587588589590591592593594595596597598599600
G S D Q H R G W F Q S S L L T A A A A R G S A P
G S D Q H R G . F Q S S L L T A A A A - - - - -
GGGAGTGACCAGCACCGTGGC---TTCCAGAGCTCTCTTCTGACCGCAGCAGCCGCG---------------
601602603604605606607608609610611612613614615616617618619620621622623624
Y K A V L T H G F T L D E K G Y K M S K S L G N
Y . A V L T H - - - - - - - - - K M S K S - - -
TAC---GCTGTGCTGACGCAC---------------------------AAGATGAGCAAGTCG---------
625626627628629630631632633634635636637638639640641642643644645646647648
V V D P R S I I E G G K D K N K E P A L G A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L R L W V A S V D Y T G D M V M G P S V M S Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A D V Y R K L R F T L R F I L G N L H D F A P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S D A V P Y D A L P A T D R F I L S S F A T L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S G L S A S Y E T Y Q F F R V Y Q A V Q R F V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A D L S N W Y L D V I K D R L Y V S A D D S F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R R A A Q T V L H S L L Q G L L P A L A P I V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
H L A E D A W Q A L P W E A P S V S V F Q A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L A P P Q Q W A A I P A D Q Q R A F K A L L Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R E E V N M V L E R A R Q D G F L G A S L E A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V L L H V A D A D L A A S L R S L Q G A G N A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
D P L R Y A F I V S Q A E L A E D E G Q V A S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
S Y S K A T V L E G V G S I A V G V S R A D G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
K C S R Q A P A P G H S S L M H K C W N Y S T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
V G C D H D H S Q L C E R C A P V I R G M G F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
9859869879889899909919929939949959969979989991000
L P A A V V P A P E A A A V P L
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_ile_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A G E G Q Q Q Q Q Q D P P A G H Q G V P V T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y P D V L D F S K M E E E V L A M W R E K D C F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R T S M K L S E G R Q P F S F Y D G P P F A T G
- - - - - - - - - - - - - S F Y D . P P F A T G
---------------------------------------AAAGTACACATC---CTCGTCCGTCACCACTAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L P H Y G H I L A G T I K D M V T R F A Y Q T N
L P H Y G H I L A G T I K D M V T R F - - - - -
CTTCGCCTTCTTACGCAGCTGCTGTACGCGGCTCACGAACTCACGCGCGCGCCACGA---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H H V I R R F G W D C H G L P V E Y E I D K M L
- - - I R R F G W D C H G - - - - - - - - - - -
---------CTTGTCAACCAGCACAACGACGTCGTTGTC---------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G I K T S H D V A K L G I D K Y N D E C K K I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T R Y V D E W R K T V E R V G R W I D F D N D Y
T R Y V D E W R K T V E R V . . . . D - - N D Y
GAACTTGGCCACCTCATTCTGCGTCATGGCCTGGATACCCTT------------CAT------GCGGTACTT
169170171172173174175176177178179180181182183184185186187188189190191192
K T M H L T Y M E S I W W V F S Q L W E K K M V
K T M H - - - - - - - - - - - - - - - - - - - -
CCTGCCAAGCAC------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y R G F R V M P Y S T A C T T P L S N F E A N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N Y K E V S D L A V T V A F Q A R A D P N T Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L A W T T T P W T L P S N L S L C V H P E L D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V K V L D N K S K R H Y W L A E A R L A E V Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K K D S K K A S K A K D V D N A A E A D A A P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T V V E K V K G A Q L V G E K Y V P L F P Y F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S S M S A T A F R V I S G T Y V T T D A G T G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V H Q A P A F G E D D Y Q A C L D A G I F E K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G K F V C P V D E N G M F T S E V T D F A G K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V K A A D P E I I K A L E T K G H L F H K A S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V H S Y P F C W R S D T P L I Y K A V E S W F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N V E A F R D R L I E C N D K T Y W V P D F V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T R R F S N W L A E A R D W N V S R N R Y W G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P M P V W H S E D W E E V V C I S S I K Q L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L S G V T G I T D I H R Q F V D D I T I P S K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P G M P P L K R V P M V F D C W F E S G S M P Y
- - - - - - - - - - - - - D C W F E S G S M P Y
---------------------------------------GGTGATGCCGGTGACGCCGGAGAGCTCCTCGAG
577578579580581582583584585586587588589590591592593594595596597598599600
A Q E H F P F E N Q E K F K S L F P A D F V S E
- - - - - - - - - - - - - - - - - - - - F V S E
------------------------------------------------------------CGGCGTGCCCCA
601602603604605606607608609610611612613614615616617618619620621622623624
G L D Q T R G W F Y T L L V L G V A L F D V S P
G L D Q T R G . F Y T L L V L G V A L - - - - -
GTAACGGTTGCGTGACACGTT---GTCACGCGCCTCGGCGAGCCAGTTGGAGAAGCG---------------
625626627628629630631632633634635636637638639640641642643644645646647648
F R N V A V S G L V L A E D G K K M S K R L K N
F . N V A V S - - - - - - - - - K M S K R - - -
ATC---TACCCAGTACGTCTT---------------------------GAAGGCCTCGACGTT---------
649650651652653654655656657658659660661662663664665666667668669670671672
Y P E P K V V I D T Y G A D A L R M Y M I S S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V V R A E P L R F R E A G V K A V V K D I L L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L F N A A K F F I S N T N Y C T A A G G Q V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q V R S T N E M D R W I L A S C Q S L L R Y V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A E M R L Y H L Y N V V P G I L R F V G D L S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
W Y V R M N R R R M K N A T D S E D R S Q A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
T M L Y L L F S V S R I V G H I A P F V A E M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
Y Q Q I K P L L P A N E Q V D S V H Y L M I P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E D T S L D D P E L E R A M S R M M N I V D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R V L R D Q M V I P I K R P V R Q V V I V H P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
Q Q Y I D D V R K V A G Y I K D E V N A F E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
M S S G E N Y L E T K L D A N F E V L G R K Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
K E M P A I R K G I Q A M T Q N E V A K F L H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
K K G V V V G K E L T I E D V K V L R Q V K E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
I A D F Q S N T D N D V V V L V D K R Q D Q E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
I D S W R A R E F V S R V Q Q L R K K A K L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
T D E V D V Y F E A E E A D L T A S I L H S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
Q I N Q T L R G V W T T M D Q K P S D A E L V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
E E D N N I S G V A V R L V F T K P K A
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_ile_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A F T P Y V P P S V L H I P Q G L L D F P A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E E E M L N Y W D Q I Q A F E T Q L R L T R S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P F N F Y D G P P F A T G L P H Y G H L L A G
- - - N F Y D . P P F A T G L P H Y G H L L A G
---------AACTTCTACGAC---CCGCCGTTCGCCACTGGGCTTCCTCACTACGGTCATCTTTTAGCCGGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T I K D V V C R Y Y S M N R R Y V N R R F G W D
T I K D V V C R Y - - - - - - - - N R R F G W D
ACCATAAAGGATGTTGTCTGTAGATAT------------------------AATCGTCGTTTTGGCTGGGAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C H G L P V E Y E V D K M L D V K S P S D V I N
C H G - - - - - - - - - - - - - - - - - - - - -
TGCCACGGA---------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K I G I R K Y N Q T C R S I V M R Y S Q E W E A
- - - - - - - - - - - - - - - M R Y S Q E W E A
---------------------------------------------ATGAGATATTCGCAGGAGTGGGAGGCC
145146147148149150151152153154155156157158159160161162163164165166167168
I V K R S G R W I D F K R D Y K T M N L L F M E
I V K R S . . . . D - - R D Y K T M N - - - - -
ATCGTCAAGCGATCT------------GAC------CGTGACTACAAGACTATGAAT---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S V W W V F K E L Y D K G L V Y E G T K V M P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S T A C A T P L S N F E A N L N Y K E V Q D M T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
C I V S F P V I V P D T N R E V G G T V D K N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N E E K I S L W K K V F S P F P E V H L V A W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T T P W T L P S N L A L C V N P S L A Y L L C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R V L D S D G G K A E N S P C Y L V A E S L V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T L F P P L V D K K T K K E T P T H E V L H R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V G Q D L A G L R Y N P L F P Y F K S S Y G A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H A C W K V V A D D Y V T S D S G V G I V H I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P F F G E D D Y R V G L E N N I I V K D G D I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C P L D D S G N F L P D V V D F A G L Y V K D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N K P I L K Y L K E A G R L V S Q S T C T H S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P Y C W R S D T P L I Y R A I P S W F V R V E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I K D S L I R N N L K A S W V P K A I Q E K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H N W L E N A R D W S I S R N R F W G C P I P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
W M S A D K T Q L K V I G S I S E L S E L T G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P L T R I R D I H R D Y L D N M T I P D P R G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D Y P P M R R I S P V F D C W F E S G S M P Y A
- - - - - - - - - - - - D C W F E S G S M P Y -
------------------------------------GACTGCTGGTTTGAGTCTGGGTCTATGCCCTAT---
601602603604605606607608609610611612613614615616617618619620621622623624
Q K H Y P F H P D Y K K A Q G V D A F L K E F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G D F I A E G L D Q T R G W F Y T L L I L S T A
- - F I A E G L D Q T R G . F Y T L L I L S T A
------TTTATCGCTGAAGGCCTTGATCAGACACGAGGC---TTCTACACACTTCTCATTCTCTCAACAGCT
649650651652653654655656657658659660661662663664665666667668669670671672
L F D S P P S M N C I V N G L V L A S D G Q K M
L - - - - - S . N C I V N - - - - - - - - - K M
CTC---------------TCC---AACTGCATCGTCAAC---------------------------AAGATG
673674675676677678679680681682683684685686687688689690691692693694695696
S K R I R N Y P D V N H I I N T Y G S D A L R L
S K R - - - - - - - - - - - - - - - - - - - - -
TCCAAGCGT---------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y L V N S P A V R A Q E L R F R E E G V K G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K D L F V P W Y N S F R F F T Q Q A T R Y H E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T G K D F L S L L I H S E K P L F E E A L K R M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V T S V L D M W I L A S F E Q L V A T V R R E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A S Y Q L Y N V L P E L L R F I D D L T K W Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R F N R D T L K G E D G V S A T Y V S L N V L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Y V L F M L C R L M A P Y T P F V C D W M Y L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
L R P V M N L P G V F D K V A Y R S I H F W A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P S L A P N T F K F Q A Q P N V I Q K M T A L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
D V I M L G R M V R K D K C G V T S F K M P L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
S V T I A H D R K E I L D E L K T L V S F I Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E L N V L E V N F H V G E E G L A T F A V I P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
F I A I K E V Y A G D K K V L G N V I N K V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
L C D I S K P E N L A F V K E L R K T G R C Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
D G I T V T S D L C K V M L E P I P V P N Y A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
A A D E N G F L C S F D T R I T Q E I K Q K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
V R I L F S K I Q Q L R R R V G M D F R D K A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
V Y V Y S V Q E G D E L V Q Y A V D S I A D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610971098109911001101110211031104110511061107110811091110111111121113111
N G T I R N S E P G N I E S K S A T E M A S I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
411151116111711181119112011211122112311241125112611271128112911301131113
N D I F K C T V Q I V K Y
- - - - - - - - - - - - -
---------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_ile_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T N P L S H Y K D T L N L L K T E F S M R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N A A I R E P E L Q S F W E K E K T Y E K L S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S N S G E K F V L H D G P P Y A N G D L H M G H
- - - - - - - V L H D . P P Y A N G D L H M G H
---------------------ACTCAATACATT---AAAAGATTCGCATCCCAAATCTAGTTGTGAAACTAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L N K V L K D I I N K Y Q L L R G R K V C F V
V L N K V L K D I I N K Y - - - - - - - - C F V
AAGCCAGTCACGAAGTACATCAACTTCCCTATTACCAGA------------------------AATCAATGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P G W D C H G L P I E L K V L Q S L E S K E R Q
P G W D C H G - - - - - - - - - - - - - - - - -
CTTACTTTTAATTTCCAATCT---------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I L T P I A L R K K A K E Y A K K Q I K I Q K A
- - - - - - - - - - - - - - - K K Q I K I Q K A
---------------------------------------------AGGAATTTTAAGATTATTTTGTCTCCA
145146147148149150151152153154155156157158159160161162163164165166167168
G F I R W G V W G E W D K P Y L T F N K D Y E A
G F I R W . . . . E - - K P Y L T F N - - - - -
ATTATTAGGGACGGT------------ATT------AGATAGATCTTCTACGGGATA---------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q Q I G V F G N M V L A G H I Y R G L K P V H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S P S S R T A L A E A E L E Y P D D H I S P S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y V S F P I I E L T E N L C Q E L K K Q G L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N R I D Q N L K R Y F D V V I W T T T P W T L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A N L G I S V S A S L E Y C V V V D E Q N R H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I I A K V L V D N L S T I L D R S F K I K A T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K G F E L E G L I Y R N P L I D R T N T V I L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G D Y I T T E T G T G L V H T A P G H G V D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N T G H S Y N L P I L C P V D Q A G T L T S E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G A F S G L N V L K D A N T S I I Q A L H I T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D L I K K E D Y N H R Y P Y D W R T K K P T I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R T T E Q W F A S L E G F R K K A L E A I Q E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V W I P D S G R N R I E S M V K E R G D W C I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R Q R T W G V P I P V F Y E K S T G E V L L N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V T L N H I Q K L I A E H G S D V W W E F E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D L L P P I Y T A E S N R W R K G T D T M D V W
- - - - - - - - - - - - - - - - - - - - - D V W
---------------------------------------------------------------GCGATGATT
553554555556557558559560561562563564565566567568569570571572573574575576
F D S G S S W A S V T S K R E G L S Y P A D L Y
F D S G S S W A - - - - - - - - - - - - - - L Y
GTAATCCTCTTTTTTAATGAGATC------------------------------------------TTTGAG
577578579580581582583584585586587588589590591592593594595596597598599600
L E G S D Q H R G W F Q S S L L T S T A V N G Y
L E G S D Q H R G . F Q S S L L T S T A V - - -
TACATTTAGCCCTGAAAATGCCCCTGC---ACTCGTGAGAGTACCTGCTTGGTCTACTGGACA---------
601602603604605606607608609610611612613614615616617618619620621622623624
A P Y K K V I T H G F V L D E K G R K M S K S L
- - Y K . V I T H - - - - - - - - - K M S K S -
------ATAACT---CCCAGTATTAAA---------------------------ATGTACTAAACCTGT---
625626627628629630631632633634635636637638639640641642643644645646647648
G N I I D P A S I L K G G K N Q K D E P P Y G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D I L R L W V S S V D Y S V D V S I G S N V L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Q L A D V Y R K V R N T S R Y L L G N L H D F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P I T D G I D I E E L P L L D K W M L N R T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V I D E V T T A F E Q F E F F R F F Q T L Q N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
C V V D L S N F Y L D I A K D R L Y V S A A N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S R R R S C Q T V L H L L L E C I A S L I A P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L C H M A E D I W Q S L P Y P V E D L S V F N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G W P T V P N N W R Q N N L K I P I N H L R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R S I V N R Q L E I T R S N G M L K G S L E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V R L E I K S K P L I R A I E M L V H S G N R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V D V L R D W L L V S Q L D L G C E S F S N V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
S T N K A E E T S F D V I V Q V S K A E G S K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E R C W H Y E K D T G I D T G Y P S L C R R C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967
N T L E R R K
- - - - - - -
---------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_ile_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K F D S N L S I N D I E T K I L K F W K D T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
C F K K S N E L S K N K K K Y T F Y D G P P F A
- - - - - - - - - - - - - - - T F Y D . P P F A
---------------------------------------------AATAGGATAAAA---TTTGGTAATTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T G L P H F G H I L A G T V K D V I T R Y Q Y Q
T G L P H F G H I L A G T V K D V I T R Y - - -
CTTAATCTTTTCACTATCTACTTCCACATTAACTGTGTCATTCATTTTAAGCCCGCAGGATTT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H N K R V D R R F G W D C H G L P V E F E I D K
- - - - - D R R F G W D C H G - - - - - - - - -
---------------AAATTCTCGTGCCAATTTTTTCTCTAATAC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N L G I S V K Q E I L E M G I D K Y N A E C K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I V M K H S S E W K D T V E K M G R W V D F D N
- - M K H S S E W K D T V E K M . . . . D - - N
------AACATTATATTTTTCTTCTGATAAATCTAAAAATGCAAGATC------------TTG------TTT
145146147148149150151152153154155156157158159160161162163164165166167168
S Y K T M D L S F M T S V W Y V F S Q L Y K K G
S Y K T M D - - - - - - - - - - - - - - - - - -
ATTAATAATCTTAATTTT------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y V Y R G Y R V M P F S T G C M T T L S S S E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K S N Y K M V N D L S A V V E F P L K S K L F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K K V S I L A W T T T P W T L P S N C G L V V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K D F D Y Q I F E I D H K F Y C M L P N R I Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F N K K E V I L H E L F K G E L L I G L E Y E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P F N Y F E E Y R R C G F F K I I G G S F V S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T D G T G I V H A A P A F G E D D Y N C F V E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N L I K Q N D L V P C P V D E N G K F T A E V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D Y K G I Y V K D A D K L I I K H L K E K I F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V K Q I S H N Y P F C W R S E K P L I Y R L V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S W F I K V S D S V D K L I K N N E I I N W V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K D I K H K K F G K W L S N A K D W A F S R S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F W G T P I P L W I S D D Y S E I L C V E S A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L E K L S G K K I T D L H M E F I D D I I L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K N G K T L R R I P E V F D C W F E S G C M P Y
- - - - - - - - - - - - - D C W F E S G C M P Y
---------------------------------------CTGTGCATAAGGCATACATCCCGACTCAAACCA
529530531532533534535536537538539540541542543544545546547548549550551552
A Q H S W P F R K V D N L N C E E I R H H F H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S D N T L V Y E N K I L E N F P A D F I G E G I
- - - - - - - - - - - - - - - - - - F I G E G I
------------------------------------------------------TTCAACACATAAAATTTC
577578579580581582583584585586587588589590591592593594595596597598599600
D Q T R G W F Y T L H V I S T L L F D K P A F K
D Q T R G . F Y T L H V I S T L L - - - - - F .
ACTATAATCGTCACT---CCATAGTGGAATTGGTGTACCCCAAAACCTACT---------------ATC---
601602603604605606607608609610611612613614615616617618619620621622623624
N V I V N G I V L A E N G K K M S K K D K N Y P
N V I V N - - - - - - - - - K M S K K - - - - -
AGCATTGGATAACCA---------------------------TTTAGGCACCCAATT---------------
625626627628629630631632633634635636637638639640641642643644645646647648
D P N I V M K T F G A D S L R M Y L I S S P V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E A D N L L F K E D G V K D V S K L L I I P W M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
N V L K F Y T T S L Q K R N D C E K L E L D N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I N Y T F N E F L S S V S N Y M N N Y Q L S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
C G L A Y K F L D N L S N W Y L R I H R E E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S G N T K I L F N I L K K F S V I M S P F A P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F S E Y S F Q C L L S S Q Q N E K S S S I N S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
H F Q M Y P E A Q D S G D N S F E N A K D I I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A I R Y L R D K H T I S L K T P L K E V K I I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
D E L F M K D A A K F S N T I I R E C H V F N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
I F V K E S E V P E L K I E Y K A K P C F E Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
K K D L K T M N D K I K I I N K L T Q S E I R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
L A F L D L S E E K Y N V K R E N I L I E K K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
T F P T G L C F A S N K F V I L V D N T I D D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
V L E K K L A R E F N S F I Q K L R K S C G L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
M N D T V N V E V D S E K I K Q I T K K F Y P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
N F S T E G Q I V S P I D S D A Q I D V F S Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
G Q E L K V I L R L N K F L
- - - - - - - - - - - - - -
------------------------------------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_ile_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_ile_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T F S V V S E R P D F P K L E E E I L E Y W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R K I N I L K L T L E K T K G R P N Y S F Y D G
- - - - - - - - - - - - - - - - - - - S F Y D .
---------------------------------------------------------TCATTTTATGAT---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P F A T G L P H Y G H I L A G T V K D V V T R
P P F A T G L P H Y G H I L A G T V K D V V T R
CCTCCATTTGCTACAGGATTACCACATTATGGTCATATACTTGCAGGTACTGTTAAAGATGTAGTTACAAGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y A T Q K G Y Y C E R R F G W D C H G L P V E H
Y - - - - - - - - E R R F G W D C H G - - - - -
TAT------------------------GAAAGAAGATTTGGATGGGATTGCCATGGA---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E I D K Q L N I T S R E D V L N K G I D F Y N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S C R S I V L R Y T Q E W K S T V E R V G R L I
- - - - - - L R Y T Q E W K S T V E R V . . . .
------------------TTAAGATATACTCAAGAATGGAAATCAACTGTTGAAAGAGTT------------
145146147148149150151152153154155156157158159160161162163164165166167168
D F D N G Y K T M D L N F M Q T V W W V F K Q L
D - - N G Y K T M D - - - - - - - - - - - - - -
GAT------AATGGTTATAAAACTATGGAT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F D K N L V Y R A Y R V M P Y S T A C A T P L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N F E C N L N Y K D V N D P S V I I T F P L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D P N I Q F L A W T T T P W T L P S N V A I A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H P E K K Y L Y F K T N H S N D I T Y V V A E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R L E W V L S E L K I K E Y N I I S D C I G A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L H N K K V I P L F D Y F K N H E S S H Q F W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I L A D N Y V T D N T G T G I V H M A P A F G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D D Y R V C V S N G I I D N H G T N L P C P M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S N G R F T E P V N D L K G I W F K D S D K I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Q E L K K K S R L L T D N T C M H S Y P F C W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R S D T P L Q Y R A V P S W F I N V E S L K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L L I N N E K T N W I P N Y V K E K R F H N W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q D A R D W C V S R N R F W G T P I P I W V S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D Y T I I K C I G S I E E L K S L A S N L K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E I N D I H R H F I D Y I E I P D P R G N N Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P L K R I E E V F D C W F E S G S M P Y A S I N
- - - - - - - - - D C W F E S G S M P Y - - - -
---------------------------GATTGTTGGTTTGAATCTGGTTCTATGCCTTAT------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y P F E N Q E L F N N I F P A D F V G E G L D Q
- - - - - - - - - - - - - - - - F V G E G L D Q
------------------------------------------------TTTGTTGGTGAAGGTTTAGATCAA
577578579580581582583584585586587588589590591592593594595596597598599600
T R G W F Y T L M V L S T A L F D Q P A F K N I
T R G . F Y T L M V L S T A L - - - - - F . N I
ACAAGAGGA---TTTTATACATTAATGGTATTATCAACAGCATTA---------------TTT---AATATT
601602603604605606607608609610611612613614615616617618619620621622623624
I V N G L V L A S D G K K M S K R L K N Y P D P
I V N - - - - - - - - - K M S K R - - - - - - -
ATTGTTAAT---------------------------AAAATGTCAAAAAGA---------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L D I V N K Y G A D S L R L F L I N S P V V R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E T L R F K E E G V K D V I K D V L L P W Y H C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Y R F F V Q E A I R Y E N T N H N I K F K S N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Q V I K N T N N I M D K W I Y S E A Q S L L K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V K T E M D A Y R L Y N V T P R L I S F L D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
C N W Y V R L N R D R M R G I Y G M N D T K N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L E I L Y Q V L M L T V K L L S P F I P F T C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L L Y S N L K N A L I D E L E E E K P E T V H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L L I P E V E E E F I D K K I E E A I N Q L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I I V M G R N L R E K K K V S V K T P L K S I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
I V H K D K S V L D Y L V E S K L I N Y I K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L N I L Q V I T D N N S E F E K I T K L V A T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
N F K V L G S R L G K S M K D V T N Y I K N E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
N N E I I Q Q F L K D G T I K I H G Y E L N L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E I I I Q T V V D N N S V I D M N N E I I Y E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
S S Q F V I G L D F T S D I E F E N M A Y S R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
L A N K I Q K I R K E K N M D P D A N V T I Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
Q L I S N K N E S K K F H T V M T S Y N D Y L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
K I I R K P I K E I S D S E L L N S I K D R I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
F E C E I E V G M D D K V N V I V I K N
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_leu_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S R K E P I N E F A A K L Y E I A R K W Q E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W M K S R I F E V E P D E S K P K F F I T A A F
- - - - - - - - - - - - - - - - - - F I T A . F
------------------------------------------------------GTCTTTTAGCTG---TAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y P N S P L H L G H S R T Y T I T D V Y A R Y
P Y P N S P L H L G H S R T Y T I T D V Y A R Y
TGCAGCTTTCTCGTCGAACTCCTGCACACCATCTATCAGCGATAGCAACGCCTCGTCGGCGCTGCGGAGGAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L R M R G Y N V L F P M G F H Y T G T P I L T M
- - - - - - - - L F P M G F H Y T G - - - - - -
------------------------TGCCGCGTCCTTCTTGGGAACACCTGCGTT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E S I A K G D R E L I E L M I E V Y D V P P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D I E K L K E P L S L A R Y F H N D A K M A M I
- - - - - - - - - - - - R Y F H N D A K M A M I
------------------------------------TACACGCAATATAGATTTCACATCCTCAACTATCTT
145146147148149150151152153154155156157158159160161162163164165166167168
E S G Y S I D W R R E F T T I D E E F K R F I V
E S . . . . D - - R E F T T I D - - - - - - - -
GTCCAC------------TAG------TTCAGGGTCACGCTTCTCCGG------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
W Q F T K L K E K G L I K K G T H P V G W C P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H N M P V G M H D T K G D V E P E I G E F T L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L F E L E K D L Y L P A A T L R P E T V F G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N I W V N P K A E Y V V V K L D G K R Y I V S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R A A F K L R F Q R D D V V E E A A I K G E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L G K R A R N P A T G K A V P I L P A E F V D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D T A S G I V M S V P A H A P Y D Y V A L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K R E H P E V L E R L G V D P D E L R P I P L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R V K G Y G E I P A K E I V E K M G I K S Q K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R D L L D E A T K K L Y S D E Y H Y G V V R E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I I E H V Y S D M P E P Y R S F A V A P V K A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I A G K S V V E A R E A A T K W L A A L G Y G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K M Y E V L N R P V Y C R C G T E I V V K V L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D Q W F I D Y G N S E W K K L A Y E L L N S M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I V P E D M R E E F V K T I D W L H E R A A A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T R G L G T E L P W A K G W I I E S L S D S T I
- - - - - - - - - - - - - - - - E S L S D S T I
------------------------------------------------CGCCTCCCTGGCCTCTACAACACT
553554555556557558559560561562563564565566567568569570571572573574575576
Y M A F Y T I I H K I R M Y G I K P E Q L T V E
Y M A - - - - - - - - - - - - - - - - - - - - -
CTTGCCAGC---------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F W D Y V L L G K G S A E E V A K K T G I K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I V E E L R R D F D Y W Y P L D S R H S G R D L
- - - - - - - - - - - - - - - - S R H S G R D L
------------------------------------------------TTCTTTAGCTGGTATCTCCCCATA
625626627628629630631632633634635636637638639640641642643644645646647648
V P N H L T F F I F N H A A I F P R D K W P R Q
V P N . L T F F I F N H A A I - - - - - - P . Q
GCCCTTTAC---TATGAGCGGTATAGGCCGTAGCTCGTCTGGATC------------------TAC---GGG
649650651652653654655656657658659660661662663664665666667668669670671672
I V V N G F V L L E G K K M S K S L R N I V P L
I V V N - - - - - - - - K M S K S - - - - - - -
ATGCTCTCTCTT------------------------GTATGGAGCATGTGC---------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R R A L R V Y G A D T V R A T L L A A A E I L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D A N F S E D L A K S V M S Q L R K F E N Y A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L S R S M D S E E T I A D K W L L S M L Q Q R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E A T T K A L D E L R T R A A T I N I L Y E M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N D V A K Y L E L R G G K P G P A L K E Y I E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W T K M M T P I A P H I A E E V W H E I L G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
T F V S I E T W P S V D P E K R D P E V E L I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S Y V D K I V E D V K S I L R V Y K G E A K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V I A V A K P E S W H I A R I V S S Y V A K R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
Q L R D A I R A V I N A G V P K K D A A Q I T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
K L Y E F L R S A D E A L L S L I D G V Q E F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E K A A I V Q L K D Y I V R K T G I E Q I E V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
Y V D E A E N K M P Q Q K I R Q V I P L R P A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987
L I E
- - -
---------
Class I
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_leu_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S V D F V K I A E K W Q K R W E E D K I F E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P S K L K Y T E Q E K K D K F F I T A A F P Y L
- - - - - - - - - - - - - - - F I T A . F P Y L
---------------------------------------------ATTTAATATGTT---TTCGTCTATTGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N G V L H A G H L R T F T I P E I T A R Y Q R M
N G V L H A G H L R T F T I P E I T A R Y - - -
GTTAGAAATTCCATTTTTAACTATTTCATTTATTAATTTTGGAATTTCTTTTCCATATCTTCT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N N K T V L W T F G F H V S G T P I I G L A E L
- - - - - L W T F G F H V S G - - - - - - - - -
---------------TGGCATCATTTTATTAACGGGAGCTCCTTT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K K Q A P E T I W A Y N K L H N I P M G E L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T L T T P E N I V N Y F S K K A T E S F K K M G
- - - - - - - - - N Y F S K K A T E S F K K M .
---------------------------TTCTTCCCCCAATTCACAATTTTCATTTATATAACTATTATC---
145146147148149150151152153154155156157158159160161162163164165166167168
F A L D W R R N F K T D D E T F K K F V E W Q F
. . . D - - R N F K T D D - - - - - - - - - - -
---------TGT------TGATATATAATTATTATTTTT---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L K L K E K N L I V K G S H P V R Y C P S C D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P V E D H D L L K G E E A T L Q E Y I L L K F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T K L N I E I D G E D K E Y E C I I P M A T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P E T I Y G V V N A W I N P N D T Y H I I K V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D E V Q S Q E E G S D E I S L K Y N G I W I V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E A S D K L K N Q D R T V E L I K E I K G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L V G K I V I N P V N N K E V P L Y P A D F V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E M G T G C V M S V P A H A P K D F V A L R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y Y S S I N K E L T D D E L I S L I K I D G Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Y P A K E I V E K M G I T N Q K D E K L E D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T H T I Y K Q E F H K G I L N E N C G E Y E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A V R D I K D K L A S D F I N N N M A E T L Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F S I P E V V C R C G E K C I V K T V K G Q W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I T Y S D L E W K K K A H N W V D K M N F V P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T I R M D F H N K I D W M K D K A C A R K K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G T R F P F D K D W V I E S L S D S T L Y M A Y
- - - - - - - - - - - - E S L S D S T L Y M A -
------------------------------------CTCATATTCTCCACAATTTTCATTTAATATCCC---
553554555556557558559560561562563564565566567568569570571572573574575576
Y T V A K T I N T N N I L P E Q L I P E L F D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V Y Y G K G D I N E I S N N T K I P V E L I N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
M R N E F E Y Y Y P L D W R C S A K D L V P N H
- - - - - - - - - - - - W R C S A K D L V P N .
------------------------------------AAGTGCTACAAAATCCTTTGGAGCATGTGCTGG---
625626627628629630631632633634635636637638639640641642643644645646647648
L T F M I F N H V A L F D D E K Y Y P K G I V V
L T F M I F N H V A L - - - - - - - P . G I V V
ACTCATTACACAGCCTGTTCCCATTTCGGAGCT---------------------TGG---CTCCTTATTATT
649650651652653654655656657658659660661662663664665666667668669670671672
N G Y V T I E G K K L S K S K G P V L P I E E V
N - - - - - - - - K L S K S - - - - - - - - - -
TAC------------------------CAATTCCTCTCCCTT------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A T N Y G P D V G R F Y I T T C A E L P H D A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V K F K E M E H A R D N L I R F Y E L A T E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D T E K T I T E L S T I D K W L L H K V H S D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K I I N E S Y N E F Q L R K I G T L F Y G L T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N L K W Y K R R G G N N N Q L L K Y V V E I W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K V L A P I T P H L C E E I W E M F G Y N K N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
N Y I S N E T F P Q L D N S Y I N E N C E L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E F I K N T M D D I R N I I N I A N I A P K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Y L Y T A D D W K F E V L K I M M E N K G A P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
N K M M P L I M K N A E L R R Y G K E I P K L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
N E I V K N G I S N P I D E E N I L N D A K Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
L E N E F Q C K I I V N G E D I G N K K R F A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969
P N K V A I Y I E
- - - - - - - - -
---------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_leu_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D F L N E I A S K W Q K V W D S E R V Y E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V D R T K E K K F I T V A F P Y T N S P L H I G
- - - - - - - - F I T V . F P Y T N S P L H I G
------------------------CTCCTTTACGTC---TTTATTTAGAAGGAATTGGGCATTAGAGGTCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H G R T Y I T A D I Y A R Y L R M K G Y N V L F
H G R T Y I T A D I Y A R Y - - - - - - - - L F
AATCTCGCTCTCATTTATACCAATTTCAGCTAAGTCCTTTAT------------------------CTCATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P F A F Q F T G T P I L S I A D A V K R G D E E
P F A F Q F T G - - - - - - - - - - - - - - - -
AGCCAACCTAGCCATTTCTTTATC------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I I S T F T N V Y Q I P I G V I S K F S D P S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L S A Y F K E D M R N T A L T L G L S I D R R R
- - A Y F K E D M R N T A L T L . . . . D - - R
------CATTTTTGACTTCATGGAGTTAATCAAATCTATTGTGTACCT------------CTC------AGC
145146147148149150151152153154155156157158159160161162163164165166167168
E F T T I D P A F E R F V Q W Q Y K R L Q E I G
E F T T I D - - - - - - - - - - - - - - - - - -
TCTCTTCTCGTATTTTAA------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y I K K E K A P V A Y C P V D E F P V G M H D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R G D I E P E I I D L D V I Y F Q G E K L L F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T A T S R P E T I F G A V A I L I N P E S D Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V I D N K S G K R L V I S T E A F K K L S F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
M N L T E E E R K K G E E L I G L N V T N P V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L K K L A V L P S K Y V E S K Q G T G L V M A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P A H E P L H Y L A L S E L K E S F E I V P V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K S E D Y G D F P A M E V L E T A Q T T S A Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L K D Y I D T L Y R L E F H K G S I R D E V V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L V P D Y M K Q F V R E R I A G R S V R E A R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S V V E L L R N L G V H G D I Y E I I N G P V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C R C G A E V V V K V F D D Q W F I D Y S N S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W K S S V L K N L D K V E I L P S D A K R E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K I I F N M K P R P F T R S R G L G V R L P W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R Q I I D S L S D S T I Y T V F Y I V A N K V
- - - - - D S L S D S T I Y T V - - - - - - - -
---------------CCTACAGTAAACCGGTCCGTTTATTATCTCGTA------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K S Y P T S I L N E R F W D Y V V L G R G D S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q L S R E L G I P K E Q L E E L R K E V E Y W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
P V D S R H S G R D L V Q N H I P Y Y L Y H H V
- - - S R H S G R D L V Q N . I P Y Y L Y H H V
---------GTAGTCCTTTAGCTCTTGTGCACTAGTAGTCTG---TGTTTCAAGAACTTCCATTGCAGGAAA
601602603604605606607608609610611612613614615616617618619620621622623624
G V L G E D K V P K R I V L N G F I R V G G K K
G V - - - - - - P . R I V L N - - - - - - - - K
ATCACC------------------CAC---AACTATCTCGAAACT------------------------ATA
625626627628629630631632633634635636637638639640641642643644645646647648
M S K S F G N V Y P L N K A I R E Y G V D T V R
M S K S - - - - - - - - - - - - - - - - - - - -
ATGTAAGGGTTC------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L A L T S T S S L S D D I E F S P N I A K S I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E Q L K H I H D F I Y N L L K L Q S V N E M R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V D L W I S S L I S E Y I D L I D N C L S N L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L R T A Y K T I Y Y D I Y E D L K D Y L E L G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
G K I N S D I V K N I I S V W V R L M A P F T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H L A E E L W H K L D N S L V V R Q K F P V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E L K Y E K R A L L E I E Y L R Y T I D L I N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
M K S K M P K E P E T V I I Y V N E D N M Q R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L I R K A I E S L K E R K S L L D F E K E V G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K E M A R L A Y E I A G D L P D K I K D L A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
G I N E S E I L T S N A Q F L L N K L D V K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
Y I Y N S K D P S T P D I K G K K S I A L P Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942
P G I I L T
- - - - - -
------------------
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_leu_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E R P E E R Q W K E W E E A G L F E A D P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D R E S V Y I T V A Y P Y P S G S M H V G H A R
- - - - - Y I T V . Y P Y P S G S M H V G H A R
---------------TACATCACGGTC---TACCCGTACCCGTCGGGTTCGATGCACGTGGGTCACGCGCGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T Y L V P D I Y A R F K R M Q G Y N V L F P M A
T Y L V P D I Y A R F - - - - - - - - L F P M A
ACGTACCTGGTTCCGGACATCTACGCGCGGTTC------------------------CTGTTCCCGATGGCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F H V T G T P V V G I A E R I K E G D E D T I R
F H V T G - - - - - - - - - - - - - - - - - - -
TTCCACGTGACGGGT---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L Y R D L Y G V P E E E L E K F T E P E A I V E
- - - - - - - - - - - - - - - - - - - - - - - E
---------------------------------------------------------------------GAG
121122123124125126127128129130131132133134135136137138139140141142143144
Y F A R E Y E E N M K R M G Y S I D W R R K F T
Y F A R E Y E E N M K R M . . . . D - - R K F T
TACTTCGCGCGCGAGTACGAGGAGAACATGAAGCGCATG------------GAC------CGGAAGTTCACA
145146147148149150151152153154155156157158159160161162163164165166167168
T V D P E Y R S F I T W Q Y L R L R E K G L V D
T V D - - - - - - - - - - - - - - - - - - - - -
ACGGTCGAC---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G E H P V R Y C P H C E N P V G D H D L L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E D A T I E E L T L V K F P V E G D D L I L V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A T F R P E T L Y G A T N V W V K P D E E Y L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V E V D G E R W V V S E E A Y R N L R H Q K D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V E K V D T V R G E E L I G E S V V N P V T G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A L P V L P A E F I D P K F G T G V V Y S V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H A P A D A A A L E D L K K D P S V L E E Y G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D P S V V E E L E P V Q V I E V E G Y G E F P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y D A L E E H G I E S Q T D P E L E K A T Q E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y R A E L H K G V M V V D E F E G T P V R E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E I K S R L I E S G D A D V M Y D F S E K P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I C R C G T E C V V R I L K D Q W F L R Y S D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E W K E R A E E L L G R M E I V P E E V R A N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E D T I E W L D D W A C A R R V G L G T P L P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D P D W I V E P L S D S T V Y M A Y Y T I A H R
- - - - - - E P L S D S T V Y M A - - - - - - -
------------------GAGCCGCTGAGCGACTCGACGGTGTACATGGCG---------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L K G K G E L P P E V F D Y V F L G E G D P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I A E K A G L D V E E L E A M R E E F E Y W Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L N W R L S A K D L V T N H L T F F I F H H A A
- - W R L S A K D L V T N . L T F F I F H H A A
------TGGCGGCTCTCGGCGAAGGACCTGGTCACGAAT---CTGACGTTCTTCATCTTCCACCACGCGGCG
601602603604605606607608609610611612613614615616617618619620621622623624
L F P E D K W P K G I V V F G M G L L E G Q K M
L - - - - - - P . G I V V F - - - - - - - - K M
CTG------------------CCG---GGTATCGTCGTGTTC------------------------AAGATG
625626627628629630631632633634635636637638639640641642643644645646647648
S S S K G N V V L L S E A L D E Y G P D V V R L
S S S - - - - - - - - - - - - - - - - - - - - -
AGCTCGTCC---------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F L A T S A E P W Q D F D W R D E Y V R G V Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
H L E R F E T L I R D H A D E S V E D K D A V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R W F L H E F R E V V E E T T E A L E G F Q I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R A Y N R A F Y G V M K L L R E Y E A M K G H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K I L G E I A E D W L K L L H P V I P F A T D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L W R E V L G E D S F L L E E E W P D P S E Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E E P E L S V A K E V L D R L I E D V R D V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V I G A E P G Y T L H V Y L A P E W Q W R A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L I L K D K E F G E V M S E L M K D E G L R E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G D E V A K I V Q E L T K E D L P E D V D V D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L R E A L T E F L E A A G R A L T D K T G A S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V V I H T D P E E A P G P E D R K A G A R P L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943
P G I W L E E
- - - - - - -
---------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_leu_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E E T Q A L E A A I R K Q W D G V F I A T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S E K K K F Y L T V A Y P Y P S G A M H V G H G
- - - - - - Y L T V . Y P Y P S G A M H V G H G
------------------TATCTGACCGTT---TACCCGTACCCGAGTGGGGCCATGCATGTCGGTCATGGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R T Y I V P D V V A R F W R M R G R E V L Y P M
R T Y I V P D V V A R F - - - - - - - - L Y P M
CGGACCTACATCGTTCCTGATGTTGTCGCCCGGTTC------------------------CTCTATCCGATG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A F H V T G A P V I G I S K R I A R R D E S A I
A F H V T G - - - - - - - - - - - - - - - - - -
GCATTTCATGTCACCGGT------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K L Y R D L Y R V P E D V L E T F T D P L N I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N H F S N E Y E R V M T Q A G L S I D W S R R F
N H F S N E Y E R V M T Q A . . . . D - - R R F
AACCATTTTTCAAATGAGTATGAACGGGTCATGACCCAGGCA------------GAC------CGACGGTTT
145146147148149150151152153154155156157158159160161162163164165166167168
T T V E P T Y S K F I E W Q W Y H L R E A G H V
T T V E - - - - - - - - - - - - - - - - - - - -
ACCACGGTTGAA------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N K G A H P V R Y C P Q C E N P V G D H D L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G D K A E I Q K F T L I M F Q Y G D A F I P C A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T L R P E T I Y G V T N L W V N P T V E Y V R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R V D G K E W I L S R Q A M E K I A L Q D H E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A E I G T I P G S D L V E K K V S H P F C G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I L P A V F V D P D M A T G L V M S V P A H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P Y D Y I A L R D L Q R K G Q Y T D I K P V G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I T V E G Y G E F P A V E A V E K A D I I N Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D P N L V E L T Q S V Y T A E H A T G K M Y E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y G G K P V K I A R E E I A G V L I E K H H S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I M Y E F D I R P V V C R C G S R V F V K V L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N Q W F L E Y S D E A W K Q Q V K D H L E N M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L V P Q E V R A E F F R T V D W L K D W A C S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R I G L G T K M P W D P E W L I E P L S D S T I
- - - - - - - - - - - - - - - - E P L S D S T I
------------------------------------------------GAACCGCTCTCTGACTCGACCATC
505506507508509510511512513514515516517518519520521522523524525526527528
Y M A Y Y T I A S R I K H I D P A L L T P A V F
Y M A - - - - - - - - - - - - - - - - - - - - -
TACATGGCC---------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D Y I F L G K E S E G L P E R E R L D G M R K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F L Y W Y P Y D F R F S A K D L I S N H L T F Q
- - - - - - - - F R F S A K D L I S N . L T F Q
------------------------TTCAGATTCTCTGCAAAAGATCTCATCTCAAAC---CTGACCTTCCAG
577578579580581582583584585586587588589590591592593594595596597598599600
L F H H C T I F P K E C L P H G M V V F G M G L
L F H H C T I - - - - - - P . G M V V F - - - -
CTCTTCCACCACTGCACGATA------------------CCC---GGTATGGTTGTCTTT------------
601602603604605606607608609610611612613614615616617618619620621622623624
L N G A K M S S S K G N V Y L L E D A I N D F G
- - - - K M S S S - - - - - - - - - - - - - - -
------------AAGATGTCCTCGTCC---------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A D T V R M F L I G S G E P W Q D F D W R N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V S S T K K Q I E R F A Q T I R D G L A A D G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E T D I D R W L V S R M Q N H I S L V T T A M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N F Q T R Q A L Q E A F F G F E S D L K W Y K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R L G Q N P A G K S A M K S L C S T W V R L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
P I I P F T C E D L W K E I G E G L V S F A P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P E S D A S L V D D A A E I A E E L L V R T V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D I E S I L R I L K T P P R K V T I C V A P S W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K W E I M T L I A G A P D K K N V I R D V M Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E E I K S R G K E A A D A V K Q C T N L F H K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P S D L V D R I I A N K P D E L A V F K A A S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
F L A E D T K L E I E V I P A D A C Q H M K A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924
S A L P F K P A I I I E
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/leu_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D F R I I E E K W Q K A W E K D R I F E S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P N E K E K F F L T I P Y P Y L N G N L H A G H
- - - - - - - F L T I . Y P Y L N G N L H A G H
---------------------CTCATTCTCAAT---TTTCAGGTTCTGCTGCAGAACTTCCCACTCCTTAAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T R T F T I G D A F A R Y M R M K G Y N V L F P
T R T F T I G D A F A R Y - - - - - - - - L F P
TAGCATCAGCTTCTTTCTGTCTTTGAAAATCTTCTTGAC------------------------CTTCCTAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L G F H V T G T P I I G L A E L I A K R D E R T
L G F H V T G - - - - - - - - - - - - - - - - -
CTCCTCGTCCTGCATAAGCTG---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I E V Y T K Y H D V P L E D L L Q L T T P E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E Y F S R E A L Q A L K S I G Y S I D W R R V
- E Y F S R E A L Q A L K S I . . . . D - - R V
---CTCAACAAGGTTTCGGAGGTATTCCTCAATTCTCTCCGCCTC------------GGT------GTATTC
145146147148149150151152153154155156157158159160161162163164165166167168
F T T T D E E Y Q R F I E W Q Y W K L K E L G L
F T T T D - - - - - - - - - - - - - - - - - - -
TGGGTAGCTTTCGAG---------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I V K G T H P V R Y C P H D Q N P V E D H D L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A G E E A T I V E F T V I K F R L E D G D L I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P C A T L R P E T V F G V T N I W V K P T T Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I A E V D G E K W F V S K E A Y E K L T Y T E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K V R L L E E V D A S Q F F G K Y V I V P L V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R K V P I L P A E F V D T D N A T G V V M S V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A H A P F D L A A I E D L K R D E E T L A K Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I D K S V V E S I K P I V L I K T D I E G V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E K L I R E L G V K S Q K D K E L L D K A T K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L Y K K E Y H T G I M L D N T M N Y A G M K V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E A K E R V H E D L V K L G L G D V F Y E F S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K P V I C R C G T K C V V K V V R D Q W F L N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S N R E W K E K V L N H L E K M R I I P D Y Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E E F R N K I E W L R D K A C A R R K G L G T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I P W D K E W L I E S L S D S T I Y M A Y Y I L
- - - - - - - - - E S L S D S T I Y M A - - - -
---------------------------CTTAACCAAATCCTCATGAACTCTCTCCTTCGC------------
529530531532533534535536537538539540541542543544545546547548549550551552
A K Y I N A G L L K A E N M T P E F L D Y V L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G K G E V G K V A E A S K L S V E L I Q Q I R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D F E Y W Y P V D L R S S G K D L V A N H L L F
- - - - - - - - - L R S S G K D L V A N . L L F
---------------------------TATTGGCTTTATGCTCTCTACAACGCTTTTGTC---TCCGTACTT
601602603604605606607608609610611612613614615616617618619620621622623624
Y L F H H V A I F P P D K W P R A I A V N G Y V
Y L F H H V A I - - - - - - P . A I A V N - - -
CGCCAGCGTTTCCTCGTCTCTCTT------------------CAG---AAAAGGAGCGTGTGC---------
625626627628629630631632633634635636637638639640641642643644645646647648
S L E G K K M S K S K G P L L T M K R A V Q Q Y
- - - - - K M S K S - - - - - - - - - - - - - -
---------------TGCGTTGTCAGTGTC------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G A D V T R L Y I L H A A E Y D S D A D W K S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E V E G L A N H L R R F Y N L V K E N Y L K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G E L T T L D R W L V S R M Q R A I K E V R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
M D N L Q T R R A V N A A F F E L M N D V R W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L R R G G E N L A I I L D D W I K L L A P F A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H I C E E L W H L K H D S Y V S L E S Y P E Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E T R V D E E A E R I E E Y L R N L V E D I Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I K K F V S D A K E V Y I A P A E D W K V K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K V V A E S G D V G E A M K Q L M Q D E E L R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
L G K E V S N F V K K I F K D R K K L M L V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
W E V L Q Q N L K F I E N E T G L K V I L D T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932
R V P E E K R R Q A V P G K P A I Y V A
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_leu_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K L K G H D G G D S V D I E R K W R D R W R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G I F Q A D P D D R E K I F L T V A Y P Y P S
- - - - - - - - - - - - - - F L T V . Y P Y P S
------------------------------------------ATCAGATGCATC---GAGTACGCTGTACTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G A M H I G H G R T Y T V P D V Y A R F K R M Q
G A M H I G H G R T Y T V P D V Y A R F - - - -
GTCTATCACCGTAACCTCTGATTTACCAAGGTCCCTGATGATCCTCCTTACAAATTCAGC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G Y N V L F P M A W H V T G A P V I G I A R R I
- - - - L F P M A W H V T G - - - - - - - - - -
------------GCCCTCAGCTGAAACCCTTCCCATTATGGA------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q R K D P W T L K I Y R E V H R V P E D E L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F S D P E Y I V E Y F S R E Y R S V M E D M G Y
- - - - - - - - E Y F S R E Y R S V M E D M . .
------------------------AACGGTATTCTGGACCATCTCCTCTGCAACCTGCACATCCCT------
145146147148149150151152153154155156157158159160161162163164165166167168
S I D W R R E F K T T D P T Y S R F I Q W Q I R
. . D - - R E F K T T D - - - - - - - - - - - -
------ATC------GTCAGGCCATGGAGCTTCTGC------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K L R D L G L V R K G A H P V K Y C P E C E N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V G D H D L L E G E G V A I N Q L T L L K F K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G D S Y L V A A T F R P E T I Y G A T N L W L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P D E D Y V R V E T G G E E W I I S R A A V D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S H Q K L D L K V S G D V N P G D L I G M C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E N P V T G Q E H P I L P A S F V D P E Y A T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V V F S V P A H A P A D F I A L E D L R T D H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L L E R Y G L E D V V A D I E P V N V I A V D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y G E F P A A E V I E K F G V R N Q E D P R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D A T G E L Y K I E H A R G V M S S H I P V Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G M K V S E A R E V I A D E L K D Q G L A D E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y E F A E R P V I C R C G G R C V V R V M E D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W F M K Y S D D A W K D L A H R C L D G M K I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P E E V R A N F E Y Y I D W L N D W A C S R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G L G T R L P W D E R W I I E P L T D S T I Y M
- - - - - - - - - - - - - - E P L T D S T I Y M
------------------------------------------CTCATCTGCAAGGCCCTGGTCCTTCAGTTC
529530531532533534535536537538539540541542543544545546547548549550551552
A Y Y T I A H R L R E M D A G E M D D E F F D A
A - - - - - - - - - - - - - - - - - - - - - - -
ATC---------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I F L D D S G T F E D L R E E F R Y W Y P L D W
- - - - - - - - - - - - - - - - - - - - - - - W
---------------------------------------------------------------------ACC
577578579580581582583584585586587588589590591592593594595596597598599600
R L S A K D L I G N H L T F H I F H H S A I F P
R L S A K D L I G N . L T F H I F H H S A I - -
AAATTTCTCTATAACCTCGGCCGCCGGGAA---ACCGTAGCCATCCACTGCTATGACATTCACGGG------
601602603604605606607608609610611612613614615616617618619620621622623624
E S G W P R G A V V F G M G L L E G N K M S S S
- - - - P . G A V V F - - - - - - - - K M S S S
------------ATC---AAGACCGTACCTTTC------------------------GTCCTCAAGGGCTAT
625626627628629630631632633634635636637638639640641642643644645646647648
K G N V I L L R D A I E K H G A D V V R L F L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S S A E P W Q D F D W R E S E V I G T R R R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
W F R E F G E R V S G I L D G R P V L S E V T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A E P E S F I G R W M M G Q L N Q R I R E A T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A L E S F Q T R K A V Q E A L Y L L K K D V D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y L K R V E G R V D D E V K S V L A N V L H A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I R L M A P F I P Y T A E E M W E R Y G G E G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V A E A P W P D F S D D A E S R D V Q V A E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V Q N T V R D I Q E I M K I L G S T P E R V H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Y T S P K W K W D V L R V A A E V G K L D M G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
I M G R V S A E G I H D N M K E V A E F V R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I R D L G K S E V T V I D E Y S V L M D A S D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
I E S E V G A R V V I H S K P D Y D P E N K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948
N A V P L K P A I Y L E
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_leu_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E L S S L F I K M A E K W Q A K W A E A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y E P E P R P G A A K F F V T A A Y P Y P N G A
- - - - - - - - - - - - F V T A . Y P Y P N G A
------------------------------------TTCGTAACAGCG---TATCCCTATCCCAACGGCGCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I H I G H G R T Y L I A D V L A R F H R H M G R
I H I G H G R T Y L I A D V L A R F - - - - - -
ATTCACATTGGCCACGGGCGGACGTATTTAATTGCCGACGTGTTGGCGCGTTTT------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V L F P M G F H Y T G T P I L T I A E A I A S
- - L F P M G F H Y T G - - - - - - - - - - - -
------CTATTCCCCATGGGATTTCACTACACGGGC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G D A T V I E E Y M A I Y G V P K D E I E K M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N P L Y L A R Y F H E Q S K R A M Q K F G L G I
- - - - - - R Y F H E Q S K R A M Q K F . . . .
------------------CGGTACTTCCACGAGCAGTCAAAAAGGGCGATGCAGAAATTC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W T R E F T T I D P E Y Q R F I Q W Q F E K L
D - - R E F T T I D - - - - - - - - - - - - - -
GAC------AGGGAGTTCACGACTATCGAC------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R E R G L I V R G R H P V G W C P R H S M P V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A H D T K D D K E P E I G Q W T L I Y F A D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G L V F P A A T L R P E T V L G V T N M W I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D A E Y A V I E H N G R K M V V S K D A A F R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S F Q G D V R I L R E A R G R E F V G R S V Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P V T G E W V P V Y E A K F V D P K V G T G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M S V P A H A P Y D Y A A L R D L N A V R L I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L I R V E G Y G D Y P A K E V V E R M G I K S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T D P A L E E A T R E V Y S A E Y T K G V M R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D V V G R V G A H L S E P A R S M L R A V F K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y F A G R P V R E A R E F I S K W L V E A G I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G V M Y D I M N K P V Y C R C G T E I V V K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E D Q W F I N Y G E G R W K E L A R K L V E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A I V P P E A K A H F L A T I D W L D K R A C A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R T R G L G T P L P W S D G W V I E S L S D S T
- - - - - - - - - - - - - - - - - E S L S D S T
---------------------------------------------------GAGAGCCTCAGCGACTCCACT
529530531532533534535536537538539540541542543544545546547548549550551552
I Y M A F Y T V I K R I R Q F G I K P E Q L I K
I Y M A - - - - - - - - - - - - - - - - - - - -
ATATACATGGCC------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E F W D Y V F L G V G T P E E V A K R T G V P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E Q L K A I R E E F D F W Y P L D S R N S G K D
- - - - - - - - - - - - - - - - - S R N S G K D
---------------------------------------------------TCCCGCAACTCGGGCAAGGAC
601602603604605606607608609610611612613614615616617618619620621622623624
L I P N H L T F F I F N H V A I F P R E K W P R
L I P N . L T F F I F N H V A I - - - - - - P .
TTAATACCAAAC---TTGACGTTCTTCATCTTTAACCACGTGGCCATA------------------CCG---
625626627628629630631632633634635636637638639640641642643644645646647648
Q I V A N G W V L R E G E K M S K S K R N V L P
Q I V A N - - - - - - - - K M S K S - - - - - -
CAAATAGTGGCCAAC------------------------AAAATGTCGAAGTCA------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L D K A V D M Y G P D P L R A T L A I T A E V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Q D L D F R H A E A I R N A Q Q L M S I Y S L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Q R L A Q T A E D R S P N W L D K W L V S E I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L V L E R A R E A Y E K V R V R Q A A V E V L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N A K S V F D Q Y L A S V E R P S K L A V E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R A W A V A M E P I A P H L A E E I W S I L G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E G L V V K A P W P Q L R P D P V A L L A K R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V D M V I D D V K R I P A F G E G V K R V V I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V N P N Y A W V K A A L S G D V K A V I N A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P P Q A A K R V V D I V K T L G D E L R G L I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A V G K F D E A E A L A S Y K N Y M E K A L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
P M E I Y N A D D P S A P D L G S K K K V A L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945
L R P G I Y I E K
- - - - - - - - -
---------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_leu_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D D R G R R C C T H S G V I A L D I E A K W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N A W D R D G I F V P K M D G R K K F M I T V P
- - - - - - - - - - - - - - - - - - - M I T V .
---------------------------------------------------------CTCGTCAAAGCC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W P Y T N G S L H V G H G R T Y T L G D I I A R
W P Y T N G S L H V G H G R T Y T L G D I I A R
TATCATTATGTCCTTCCTGCGCTTCGCCAGGTACTGCATGTATTTCTTCGACTGGCCGGAAACACTGTTATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y K R S R N Y N V L F P M G F H Q S G T P I L A
Y - - - - - - - - L F P M G F H Q S G - - - - -
GAG------------------------GTCGGCATTCGCCACAGTTATCTCCACCGA---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F S E R I R A G D R S T I D L Y T S Y L K E Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E K D I D A L I E S F K D P K N I A D Y F S N A
- - - - - - - - - - - - - - - - - - D Y F S N A
------------------------------------------------------GTCGAACGGATCAACCGA
145146147148149150151152153154155156157158159160161162163164165166167168
I I N D F K H L G Y S I D W T R R F T S A D E F
I I N D F K H L . . . . D - - R R F T S A D - -
CACGTATGTGTCCGATACGTAGCT------------CTC------GTGAGGTATAACGGGCATCAA------
169170171172173174175176177178179180181182183184185186187188189190191192
Y Q K F V Q W Q F R R L N E K G L V K Q G R Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I L Y S L E D D N A V G E D D I K D G D T D K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T I E E Y T A I F F R G K S F D L I A A S L R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E T I Y G I T N I W V N P D V K Y V K V K I S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R M A V V S E E C S T K L K F Q G N E I E V A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E A S V Q E I Q K Q T Y T T P A G K E V K V Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A D F V D P D N G T G I V Y S V P S H S V Y D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V Y Y R K K R G K D F P V I I E A P M K M K D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E S K Y D L E T E E G R E E A T K D L Y R N E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y Y G K L V D S G P Y T G M T V R E A R E A V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R D L I S S G N A F T F Y E T S R H A V T R S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S K V I V A V L P D Q W F L D Y S Q P W L K D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G H T M I N T M T M H P E V Y R N V M N D A I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
W L K E R P C A R R R G L G T R L P F D D R W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I E S L S D S T I Y P A V Y T N S I P L R S L Y
- E S L S D S T I Y P A - - - - - - - - - - - -
---CGCCTCCCGCGCTTCCCTCACGGTCATGCCGGT------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E T G K L D D D A I T R I F M N G E P K N E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S E A K R Q F E Y W Y P V D I R L T A I P H I S
- - - - - - - - - - - - - - I R L T A I P H I S
------------------------------------------CTTTCCGCGCTTCTTCCGGTAATACACGTA
577578579580581582583584585586587588589590591592593594595596597598599600
N H L S F Y V L N H A A I F P K E K W P A G L I
N . L S F Y V L N H A A I - - - - - - P . G L I
ATC---AACAGAGTGCGACGGTACGGAATACACTATCCC------------------CAC---ATCGGCCTG
601602603604605606607608609610611612613614615616617618619620621622623624
I S G L V V S N G A K I S K S K G N V V S L L E
I S - - - - - - - - K I S K S - - - - - - - - -
GTATAC------------------------GGTGTAGGTCTGCTT---------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I A K K Y S A D I Y R L Y V A V Q A D I S S T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D W N E T D L A S I T R R F N E F K D L M A G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K Q D T S D L T F E E A W F V A R F S V R L R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F M E S M D R Y Q I R D A Y I N I F Y G V L N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L R Y L S S R G G D V N R A L T P V I A D W L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A L M P V I P H H A E E Y W H S Y V S D T Y V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V D P F D E N F Q D R Y E R T V R R F G M T C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
Q M Y S A M D Y V E K V L Q D V K N I M Q V T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I E P K S V E I T V A N A D V V R A A Q E F L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
N S V S G Q S K K Y M Q Y L A K R R K D I M I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G F D E Y D V L Q R N Q V Y L S K Q I G C P V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910
I E R G D V I N G K I A L P G K P V I Y I S
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_leu_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K F F V T A A F P Y V N G Y L H L G H L V T
- - - - F V T A . F P Y V N G Y L H L G H L V T
------------TTTGTAACAGCA---TTCCCATATGTAAATGGTTATTTACATTTGGGCCATCTAGTAACA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y I K A E I T A R Y K K M R G Y D V L F P M G F
Y I K A E I T A R Y - - - - - - - - L F P M G F
TACATAAAAGCAGAAATTACAGCAAGATAC------------------------TTATTCCCAATGGGCTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H A T G A P I Y A A A Y K V S I G D P K Q I E T
H A T G - - - - - - - - - - - - - - - - - - - -
CATGCTACTGGT------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K K M G I K D I E K F K D P A Y W V E Y F S K
- - - - - - - - - - - - - - - - - - - E Y F S K
---------------------------------------------------------GAGTATTTCTCTAAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A A K E D L S K L G F M I E W E R S F T T V F N
A A K E D L S K L . . . . E - - R S F T T V - -
GCAGCAAAAGAGGATTTATCTAAATTG------------GAA------AGATCTTTTACCACAGTA------
121122123124125126127128129130131132133134135136137138139140141142143144
K P F H K F V E W Q Y H R L R E K G Y I Y R G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H P I V W D P K V N M V I G D H D R P D D Y A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I R P I E G V I I K F Y S K D L D A Y L P A F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L R P E T V F G V V N I W V N P E T E Y V L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K K V F Y V Y E L Y S L Y K K F G R L P L N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E N R D K L E K L I Q D Y N N L L D R L K Q Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G I D L I A H A E E I A Y K P K E E F V K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E F A E K E G I K I E E K D I E L L Y E Y Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T K V E T Q E E K W I L P N T I V I E E L K N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D F E I E I I G K I D K L I K T L A E N P V T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E L V P V L P A K F V D P E V G T G I V M S V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S H A P Y D Y V G L L D L I K T E L K E F A E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L K N V R P V V K V E G F S E M P A K D I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S M N I T S Q E E R D K L E K A T Q R L Y S K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F Y H G V L T E H A Q Q F Q G L P V K E A K M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I A E Y L M E N G Y G Y I Y Y T L P V R F K S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Y G N K V V V K L V K G Q W F I K Y S D K Q W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E L A H K A V E N M K F Y P P Q V K E L I K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I D W Y D D W A F T H Q K E L G T A L P W D P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
W V I E S L S D S T I Y T A Y Y T I A H I L Q H
- - - E S L S D S T I Y T A - - - - - - - - - -
---------GAATCCCTCTCTGATTCTACAATATACACAGCT------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
P E K Y N I D W D K L T I D V F D Y V F L G K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D P K E I A K K T G I S E E I L K E M R N Q F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y W Y P V D I R F S A Q D L I A N H L V F Y I F
- - - - - - I R F S A Q D L I A N . L V F Y I F
------------------ATAAGGTTTAGCGCCCAAGATTTAATAGCAAAC---TTGGTATTCTATATATTC
673674675676677678679680681682683684685686687688689690691692693694695696
H H V A I F P E S K W P R G I A V S G F V T V N
H H V A I - - - - - - P . G I A V S - - - - - -
CACCATGTAGCAATT------------------CCC---GGTATAGCAGTTTCT------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G E K M S K S K G N F I T I R E A I Q R Y G R D
- - K M S K S - - - - - - - - - - - - - - - - -
------AAGATGTCTAAAAGC---------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A V R L A A A Y A G N A E L V D Q N I D L E F M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E K A K N E I I P R I E S Y L D M E G Y D R D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N S L D K W I V N R I R L Y F K K L E E Y Y E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I R P R D V I N E F F K L E N D F N F Y R A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L E K P H K R A I E Y F K K A V K A L W P I I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
H V V R E P A W I G K E E P D E P W I R V G Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V D Q V I K D L A N T L K L V R I S M A R N V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
H R L A D L V K L Y Y E G A K L T E E E K E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
R E F I E W K P V R I K I I Y K N P S E F D I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R D I I P Y I E K V F G G K V V L E L A S E S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977
E E K A K R A K E F K P A F V I E
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_leu_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E Q D Y K P H E I E E K W Q K K W N E S L I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q A D P D K R E K F F I T I P Y P Y L N G N L H
- - - - - - - - - - F I T I . Y P Y L N G N L H
------------------------------TTCATAACAATC---TACCCATACCTTAACGGGAACCTGCAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A G H T R T F T I G D V V A R H K R M L G Y N V
A G H T R T F T I G D V V A R H - - - - - - - -
GCAGGACATACCCGGACCTTCACCATCGGCGACGTGGTGGCAAGGCAC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L Y P M G F H V T G T P I V G L A E L I A S R D
L Y P M G F H V T G - - - - - - - - - - - - - -
CTTTACCCTATGGGTTTCCACGTAACCGGC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P Q T M D V Y E H L H G I P G D I L P T L D T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E K I V D Y F K R E A E K A M R M I G Y S I D W
- - - - D Y F K R E A E K A M R M I . . . . D -
------------GACTATTTCAAGCGGGAAGCCGAGAAAGCTATGCGCATGATC------------GAC---
145146147148149150151152153154155156157158159160161162163164165166167168
R R K F T T T D P T Y K K F I E W Q Y I R L E E
- R K F T T T D - - - - - - - - - - - - - - - -
---CGCAAGTTCACGACAACCGAC------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G L I V K G S H P V K W C P N D N N P V E D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D I L Y G E E A T I V E Y T L I K F R Y N D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L P C A T L R P E T T F G V T N L W V N P D V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y V K A R V E K D G N E E F W V V S K E A F R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L T F T D R T V E Y V E D V P A K S I I G I K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T N P I T G D E V I S L P A S F V K P E N G S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I V M S V P A H A P F D Y L A L R D L Y D A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E Y G I T E D L R D I K L I S L I Q V P E F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E F P A K E I V E S M G I A N Q K A P K A E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T K I V Y R R E F H G G V L K E I T G K Y R G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P V S K I K D V L T R D L I A S N A G E T F Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F S E P V V C R C G T P C V V N M V K G Q W F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N Y S N P E W K A K V Y K C L S Q M R I I P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y R V E F E N K V D W L K D K A C A R R K G L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T R L P F D K E W L I E S L G D S T I Y M S Y Y
- - - - - - - - - - - E S L G D S T I Y M S - -
---------------------------------GAGTCCCTCGGGGATTCGACAATCTACATGAGC------
529530531532533534535536537538539540541542543544545546547548549550551552
I I A R F L E R G D L A L E Q L T L S F F D Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L L G I G D S A A V S A E T G L K Q E L V E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R S H F N Y W Y P V D L R S S G K D L V P N H L
- - - - - - - - - - - L R S S G K D L V P N . L
---------------------------------CTGCGTTCTTCCGGAAAGGACCTTGTCCCTAAC---CTG
601602603604605606607608609610611612613614615616617618619620621622623624
L F F L F H H V A L F E E E K W P R A L A V N G
L F F L F H H V A L - - - - - - P . A L A V N -
CTCTTCTTCCTCTTCCACCACGTAGCCCTC------------------CCA---GCCCTTGCAGTAAAC---
625626627628629630631632633634635636637638639640641642643644645646647648
F V S L E G Q K M S K S K G P I L T L E S A V S
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------AAGATGAGCAAGTCC------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A Y G A D I T R M Y I L S T A E Q T Q D A D W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K T G I D S A R R Q V D R F Y S F A K D V I E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G K R A T L S T E L K L I D R W M L S R M Q K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I M E T N I A L D S I Q T R E A I Q N S F F L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I N D V R W Y Q R R G G E A L L Y Y V L D N W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R L M A P F T P H L C E E I W E A M G H E D P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S L A Q Y P L D N E D L I D E G A E L A E E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K S T L N D I E E I V R V T K M T P Q K V Y L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T A P A W K A E A I R C A C E L Q I E A P L E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G A L I K T L M A N P E L K R F G K E I P K F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
Q K I I P E F K S G G A E R Y E T F A Y L G L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E Q A L L K E S A S F L E K E I G C P V E I Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
A D S P E Y D P Q K K S R F A E P L R P A I Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961
E
-
---
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_leu_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M V M I D F K E I E K K W Q K R W E E A K I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E A N P D D R E K F F I T A A F P Y L N G V L H
- - - - - - - - - - F I T A . F P Y L N G V L H
------------------------------TTTATAACTGCG---TTTCCATATTTAAATGGAGTTTTGCAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A G H L R T F T I P E V V A R F Q R M K N K N V
A G H L R T F T I P E V V A R F - - - - - - - -
GCTGGACATTTAAGAACTTTCACTATCCCAGAGGTTGTTGCAAGATTC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L W T F G Y H V T G T P I L G L A E L I K N R D
L W T F G Y H V T G - - - - - - - - - - - - - -
TTATGGACTTTTGGTTATCATGTTACAGGA------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K T I W A Y T E L H G I P K E E L L E L T T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E K I V E Y F S K K A E E A F K R M G F S L D W
- - - - E Y F S K K A E E A F K R M . . . . D -
------------GAATATTTCTCAAAGAAAGCTGAAGAAGCATTTAAAAGAATG------------GAT---
145146147148149150151152153154155156157158159160161162163164165166167168
R R N F K T D D K V F N K F I E W Q F H K L K E
- R N F K T D D - - - - - - - - - - - - - - - -
---AGGAACTTTAAAACGGATGAT------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G L I V K G S H P V R Y C P R C D N P V E D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D I L V G E N A T L V E Y I L I K F T T E D G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I M P M A T L R P E T V F G V T N V W V N P E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T Y V K A K V Y L E K E T E N G I E L I E N G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W I M A K E C A E K L K H Q D R K I E I I E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K G E Q L I N K K V K N P V T G K E V P I L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K F V K T N I G T G C V M S V P A H A P Y D Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A L R D L G L V D E I G L I P L I N V P G Y G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y P A K E I V E K M G I K S Q E E E D K L E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T K K I Y K D E F H K G V L N E N C L D Y E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P V R E I K D K L T K D L I D K G L A E I M Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F S E E K V I C R C G T P C I V K M V K G Q W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I K Y S D E K W K E L A H K C I D K M R F I P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N L R Q V F H E K I D W M K D K A C V R R R G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G T K F P F E E G W V I E S L S D S T I Y P A Y
- - - - - - - - - - - - E S L S D S T I Y P A -
------------------------------------GAATCTCTATCTGATTCAACAATTTATCCAGCA---
529530531532533534535536537538539540541542543544545546547548549550551552
Y T V A K Y I N Q H N I K P E Q L T L E L F D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V F L G K G D V D K I A K E T G I P K D I I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
M R K E F I Y Y Y P V D W R C S A K D L I P N H
- - - - - - - - - - - - W R C S A K D L I P N .
------------------------------------TGGAGATGTTCAGCTAAGGATTTGATTCCAAAC---
601602603604605606607608609610611612613614615616617618619620621622623624
L T F Y I F N H V A I F P E E F W P R G I V V N
L T F Y I F N H V A I - - - - - - P . G I V V N
TTAACATTCTATATCTTTAACCACGTTGCAATA------------------CCA---GGGATAGTAGTTAAT
625626627628629630631632633634635636637638639640641642643644645646647648
G Y V T I E G K K L S K S K G P V L P V L E V A
- - - - - - - - K L S K S - - - - - - - - - - -
------------------------AAGTTATCTAAGTCA---------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E K F G A D V G R F Y I T T C A E L P Q D A D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K F K E M E N T K K V L E R L Y L F A K E I A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R R G E T G E E F S Y I D K W L L S R L Y K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K Q Y D E Y M E N F E L R K A G I L L Y Q L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D L K W Y R R R G G N N I R V L E E F L E V I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K L M M P F T P H L C E E M W E I L G K E G F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S L A K F P E V K E E F I N D E I E K G E E Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K A V M E D I K E I I N V A K V Q P K R I Y L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
T A D D W K Y E I L K I I K E N E G K T I K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
M P I I M K N P E F R K Y G K E I P K L V N Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I K L N A E I I N E V E V L E N A K E F L K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V G V E D I I I N G E D K A N K K R V A I P F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942
P A I Y L E
- - - - - -
------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_leu_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N E F A E K L Y K I A R K W Q E R W L R S R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F E A D P D E S K P K F F I T A A F P Y P N S P
- - - - - - - - - - - - F I T A . F P Y P N S P
------------------------------------TTCATAACCGCG---TTCCCCTATCCCAATAGCCCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L H L G H S R T Y T I T D A Y A R F M R M R G Y
L H L G H S R T Y T I T D A Y A R F - - - - - -
CTGCATCTGGGGCATAGCAGAACATACACCATAACGGATGCGTACGCGCGCTTC------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N V L F P M G F H F T G T P I L T M A E A I A N
- - L F P M G F H F T G - - - - - - - - - - - -
------CTGTTCCCGATGGGCTTCCACTTCACCGGC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G D K D L I D L M I N V Y D V P P E D I D K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D P L S L A R Y F S R D A K Q A M I E S G Y S I
- - - - - - R Y F S R D A K Q A M I E S . . . .
------------------AGATACTTCAGCCGCGACGCAAAGCAGGCGATGATAGAGTCC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W R R E F T T I D E E F K K F I V W Q F T R L
D - - R E F T T I D - - - - - - - - - - - - - -
GAC------AGAGAGTTCACAACAATAGAC------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K E K G L L K K G T H P V G W C P V H N M P V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M H D T K G D V E P E I G E F T L I L F E L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G L Y L P A A T L R P E T V F G V T N V W V N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A A D Y V I V A I D G R R Y V V S E R A A F K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R F Q R D N V V V E R K L R G E E L L G R R V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N P A T G R A V P I L P A D F V D P N T A T G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V M S V P A H A P Y D Y V A L E E L K R E K L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T L K K L G V D P A E L E P I P L I R V K G Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E I P A R D I V E K M G I K S Q L Q R K L L D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A T R K L Y S D E Y H S G I V R E D I L N Y I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P D M P E P Y R S F A I A P V K A W I A G R S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P E A R D A A A R W L A A L G Y G D R M Y E I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N R P V Y C R C G N E I V V K V L K D Q W F I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y G N P E W K K L A Y E L L N S M R V V P D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R E E F V K T I E W L H E R A A A R T R G L G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E L P W S K G W I I E S L S D S T I Y M A F Y T
- - - - - - - - - - E S L S D S T I Y M A - - -
------------------------------GAAAGTCTAAGCGACTCTACAATATACATGGCG---------
553554555556557558559560561562563564565566567568569570571572573574575576
V I H K I R R Y G L K P E Q L T T G F W D Y V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L G K G D P D K V S E K T G I G R D V L E D L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R E F N Y W Y P L D S R H S G R D L V P N H L T
- - - - - - - - - - S R H S G R D L V P N . L T
------------------------------TCGCGGCATAGCGGTAGGGACCTGGTGCCGAAC---CTAACG
625626627628629630631632633634635636637638639640641642643644645646647648
F F I F N H A A I F P R E K W P R Q I V V N G F
F F I F N H A A I - - - - - - P . Q I V V N - -
TTCTTCATATTCAACCATGCTGCCATC------------------CCT---CAGATAGTGGTGAAT------
649650651652653654655656657658659660661662663664665666667668669670671672
V L L E G K K M S K S L R N I I P L R R A L R V
- - - - - - K M S K S - - - - - - - - - - - - -
------------------AAGATGAGTAAGAGC---------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Y G A D T V R A T L L A A A E L L Q D A N F S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E L A R S V M D R L R R F E S Y A Q R A R E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G E E T V A D R W L R S I L Q R R V E E V T K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
F E E L R T R A A T V T V L Y E M S N D V V K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L E I R G G E P G P A L R E Y I E A W T K M L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P I A P H I A E E V W H E I L G K E S F V S L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K W P S P D P S R R D L Q A E L M V A Y V D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V E D V K S I L R V Y K G E P R R L V V A V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P S S W R I A R I V A A H V A R R S Q L R D A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
H A A I E A G A P G K E A A R L V R R L Y E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
Q S V D E E L L S L I E G V D V F D E K Y A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
A M R D Y I S A K T R I R E I S V Y Y V E E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981
G R L P E S K L N Q V T P L R P A I L I E
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_leu_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T Y Q P R E I E E K W Q D R W A E G G R Y H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D P E P D A D E D A T F V T V P Y P Y P S G G M
- - - - - - - - - - - F V T V . Y P Y P S G G M
---------------------------------GATGTAGCCGGC---CGTCTCGTACAGTTCGGTCTCGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H I G H A R T Y T V P D V Y A R Y R R L Q G D N
H I G H A R T Y T V P D V Y A R Y - - - - - - -
GACCTCGTCGAGCGCCGCGAGTTCGTCGTCCTCGCGCTCGCGGACGTCCGC---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L F P I A W H V T G T P I I G A V N R L Q K G
- L F P I A W H V T G - - - - - - - - - - - - -
---GACCGCGTCACCCTTCTCGCGCAGCGACTC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E E Q L S V L R D T Y N V P E D E L E T L E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P M G F A R Y F I E N H Y K E N M Q S L G L S I
- - - - - R Y F I E N . Y K E N M Q S L . . . .
---------------GTCGATGACCTCGCGCAC---GTCCGCCAGGTTCTCGACCAGTCG------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W R R E F T T N D E R Y S K F V T W Q Y E T L
D - - R E F T T N D - - - - - - - - - - - - - -
CAC------TGACTCCAGGTCGGCGTCCGG------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R D H G R L E K G L H P V K Y C T D E E N P V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T H D I L E G E E A E F Q E Y T L V K F G H G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T V V P M A T L R P E T V R G V T N A Y I D P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A D Y V E A E V D G E R W L V S D E A A E K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L Q Q R D V R I L D R F T G D R L V G E R V T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P V T G E D V L V L P A D F V D A D N A T G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M S V P A H S P D D W V A L E E A K A D D D R M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R E Y G I D P A D V D A I E P K A I I D V E A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D D E F P A R A A V A E H G I E S S D D P A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D A T Q Q V Y N R E F H S G T L K E M Y G E Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G E V V E D V R D E L A D H F Q A S G E F D T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y E F S E E V V C R C G G E V E V A K Q D T W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L T Y S D E D W K E L A H D A I A D L D A I P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N T R D Q L D H T V D W L N E W P C I R N Y G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G T R L P W D D D F V I E P L S D S T V Y M S Y
- - - - - - - - - - - - E P L S D S T V Y M S -
------------------------------------CGTGTCGAACTCCCCGCTGGCCTGGAAGTGGTC---
529530531532533534535536537538539540541542543544545546547548549550551552
Y T I A H R L E D V P P E E L D R E F F D T L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y G A D A V D D P D E T A L D L R E E W D Y W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
P V D Y R I S G N D L I S N H L T F Y L F H H T
- - - Y R I S G N D L I S N . L T F Y L F H H T
---------GGCCCGCGCCGGGAACTCGTCGTCGTAGGCCTC---GTCGATGATGGCCTTCGGCTCGATGGC
601602603604605606607608609610611612613614615616617618619620621622623624
D L F D E S K W P E G I A V A G M G L L E G K A
D L - - - - - - P . G I A V A - - - - - - - - A
GTCGAC------------------GTA---CCGCATCCGATCGTC------------------------GAC
625626627628629630631632633634635636637638639640641642643644645646647648
M S S S S G H V V L P T E A I E E Y G A D T V R
M S S S - - - - - - - - - - - - - - - - - - - -
CCAGTCGTCCGG------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F F L L N S A E P W Q D F D W R G D E V G T T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D Q L A R F H E R A Q D V I E S E A G E R D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R I D R W L L S K L Q S T V R D A T E A M D E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q T R K A S Q E A F Y H F E E H L T W Y R K R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D L D R P G A R W T L Q E V L Q T R L R L L A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I V P F L A N E L H E Q L T G D P V E D A A W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E P D A D L E S A R V E V E E R L V E N L A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V R E V I D V T G T D P D S I A I Y T A A P W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
H R V Y E T V R E T G P D V G A V M G K V M Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E S L R E K G D A V N D L A Q D L V A D V R E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
E D D E L A A L D E V D E T E L Y E T A A G Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A R E F D A S V D V V A E Q D A D A D R A S R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946
V P F R P A I D L E
- - - - - - - - - -
------------------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_leu_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K Y E F I K I E K K W Q E F W D N N K T Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V E E D P S I P K E K R L Y I L D M F P Y P S A
- - - - - - - - - - - - - Y I L D . F P Y P S A
---------------------------------------TATATACTTGAC---TTCCCCTATCCTTCTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N G L H V G H P E G Y T A T D I F G R Y K L L N
N . L H V G H P E G Y T A T D I F G R Y - - - -
AAC---CTTCATGTTGGTCATCCAGAAGGATACACAGCAACAGACATATTTGGAAGATAC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G F H V L H P I G F D S F G L P A E N Y A I Q T
- - - - L H P I G F D S F G - - - - - - - - - -
------------CTTCACCCAATAGGATTTGATAGCTTTGGA------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G T H P Q K S T E E N I N K F K K Q I K A L G F
- - - - - - - - E E N I N K F K K Q I K A L . .
------------------------GAAGAAAATATTAATAAGTTTAAAAAACAAATAAAAGCTTTG------
121122123124125126127128129130131132133134135136137138139140141142143144
A Y D W D R E I R T H E E N Y Y K W T Q W I F L
. . D - - R E I R T H E - - - - - - - - - - - -
------GAT------CGAGAAATTAGAACACATGAG------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q L Y K K G L A Y V K E M P V W Y C P E L G T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L A N E E I I Q T S D G P K S E R G S Y S V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K Y L R Q W V L K I T K Y A E R L L D D L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E W P E S V K E M Q R N W I G K S T G V E I E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E I E G H S D K I K V F T T R P D T I F G I T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L V I A P E N K L I E K I T K N N F K Q N V L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y V K H E E L K S D L N R T S L E K D K S G V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T G S Y A F H P I T N E K I P I W V G S Y V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T Y G T G A V M G V P A H D E R D F Q F A K K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q L K I L P V I S K S G K N E I L E K A F V D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G I S I N S P N E F N N L K N S E V K D K V I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W L T K N K K G K E K V A Y K L R D W I F S R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R Y W G E P I P I L F D K L G N A I P L E E N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L P L K L P E I A N Y K P S G T G E S P L S R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K D W V N V K D M G F T R E T N T M P Q W A G S
- - - - - - - - - - - - - - - - - - P Q W A G S
------------------------------------------------------CCTCAATGGGCAGGCTCT
505506507508509510511512513514515516517518519520521522523524525526527528
C W Y Y L R Y L D P K N S K E F A N K K K I E Y
C W Y Y L - - - - - - - - - - - - - - - - - - -
TGTTGGTATTATTTA---------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
W M P V D L Y I G G A E H T V L H L L Y S R F W
- - - - - L Y I G G A E H T V L . L L Y S R F W
---------------CTATACATAGGCGGAGCTGAACATACAGTATTA---CTGCTTTACTCAAGGTTTTGG
553554555556557558559560561562563564565566567568569570571572573574575576
H K V L Y D L G Y V N T K E P F K K L I N Q G I
H K V L - - - - - - - - - - - F K . L I N Q - -
CACAAGGTTCTT---------------------------------TTTAAA---CTAATAAATCAA------
577578579580581582583584585586587588589590591592593594595596597598599600
I T S F S Y Q K E N G V L I P N D Q V I E K D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K F F D K K D N K E V T Q V I A K M S K S L K N
- - - - - - - - - - - - - - - - K M S K S - - -
------------------------------------------------AAAATGTCAAAATCT---------
625626627628629630631632633634635636637638639640641642643644645646647648
V I N P D D I I K E F G A D S M R I Y E M F M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
P L T D S K P W N T K G I I G V F R F L N K I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
N L R E K E L S K E N P P R E I I S E L H K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K K V T E D T E K L N F N T A I S A M M I F I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E L L K Y E K N Y L N I F K P F I I I L S P Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
P H L A E E L W E Y I G E L P S L F K N S K W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K F D E S L I I K G K K E I V L Q I N G K I K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K I L L N K E T G E K E L K E I A M E N S K I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S N L L N K K I V K I I V I K N K L V N I V I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_leu_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F D H Q T I E K K W Q D Y W L K N K T F A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R E D K S K P K F Y A L D M F P Y P S G A G L H
- - - - - - - - - Y A L D . F P Y P S G . G L H
---------------------------CAGCTCTTCAAG---TTCTTTGTCCGCGTCGGC---AACGTTCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H P E G Y T A T D I L S R M K R M Q G Y N V
V G H P E G Y T A T D I L S R M - - - - - - - -
CTTCGCTTTCACCTTTCCGTTCAGCTGAACGACGATTTCAATTTCATC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L H P M G W D A F G L P A E Q Y A L D T G N D P
L H P M G W D A F G - - - - - - - - - - - - - -
GACAGGCCATGCTTCATACGCGATCGTTTC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A V F T E Q N I D N F R R Q I R A L G F S Y D W
- - - - E Q N I D N F R R Q I R A L . . . . D -
------------AAGCAATTTCACGAAGCCTTCCATGTATTCTTTCGGAAGCTG------------TGC---
121122123124125126127128129130131132133134135136137138139140141142143144
D R E V N T T D P D Y Y K W T Q W I F L K L Y E
- R E V N T T D - - - - - - - - - - - - - - - -
---GATGAAGACCATCAGCTGTGA------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K G L A Y V D E V P V N W C P A L G T V L A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E V I D G K S E R G G H P V E R R P M K Q W M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I T A Y A D R L L E D L E E L D W P E S I K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M Q R N W I G R S E G A H V H F A V D G T D E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F T V F T T R P D T L F G A T Y A V L A P E H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L V Q K I T T P E Q Q D A V D A Y I E E V Q S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D L E R T D L A K T K T G V F T G A Y A V N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A N G E K I P V W I A D Y V L A T Y G T G A V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V P A H D E R D H E F A S A F G L P I K E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K G G D V E K E A Y T G D G E H I H S D F L N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L D K A A A I E K M I Q W L E E N G K G E K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T Y R L R D W L F S R Q R Y W G E P I P V I H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D G T S T P V P E E E L P L I L P K T S E I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P S G T G E S P L A N I K E W V E V T D P E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K G R R E T N T M P Q W A G S C W Y F L R Y I
- - - - - - - - - - P Q W A G S C W Y F L - - -
------------------------------TCCGTTTGCCGGATTAACCGCATATGCACCTGT---------
505506507508509510511512513514515516517518519520521522523524525526527528
D P K N P N E L A S P E K L Q E W L P V D M Y I
- - - - - - - - - - - - - - - - - - - - - M Y I
---------------------------------------------------------------GGCGTTGAC
529530531532533534535536537538539540541542543544545546547548549550551552
G G A E H A V L H L L Y A R F W H K F L Y D I G
G G A E H A V L . L L Y A R F W H K F L - - - -
TGCGTCTTTCTGTTCAGGCGTTGT---TTTTTGAACCAAATCATGCTCCGGAGCCAGCAC------------
553554555556557558559560561562563564565566567568569570571572573574575576
V V P T K E P F K Q L Y N Q G M I L G E N N E K
- - - - - - - F . Q L Y N Q - - - - - - - - - K
---------------------CGT---GAAAACCGTAAACGT---------------------------AAC
577578579580581582583584585586587588589590591592593594595596597598599600
M S K S K G N V V N P D E I V E T H G A D T L R
M S K S - - - - - - - - - - - - - - - - - - - -
ATGCGCCCCTTC------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L Y E M F M G P L D A S I A W S T T G L D G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R F L D R V W R L F I D D N G G L N E K I V E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A G E T L E R V Y H E T V M K V T D H F E G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F N T G I S Q L M V F I N E A Y K A D Q L P K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y M E G F V K L L S P V A P H L A E E L W S R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G H E E T I T Y E A W P V Y D E A K L V D D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E I V V Q L N G K V K A K L N V P A D A D K E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L E E L A K N N E K V K E Q L E G K T I R K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804
A V P G K L V N I V A N
- - - - - - - - - - - -
------------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_leu_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R S A P C V A R R S K P S P N H T M H E R Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A D V E A A A Q S D W R A A D A Y R S K E D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N R K K F Y C V S M L P Y P S G K L H M G H V R
- - - - - Y C V S . L P Y P S G K L H M G H V R
---------------TACTGCGTGTCG---CTGCCTTACCCGTCGGGCAAGCTGCACATGGGTCACGTGCGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N Y T I N D V M Y R Y L R M N G Y N T L M P M G
N Y T I N D V M Y R Y - - - - - - - - L M P M G
AACTACACGATCAACGACGTGATGTACCGCTAT------------------------CTGATGCCGATGGGT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W D A F G M P A E N A A M A N G V P P A Q W T Y
W D A F G - - - - - - - - - - - - - - - - - - Y
TGGGACGCGTTCGGG------------------------------------------------------TAC
121122123124125126127128129130131132133134135136137138139140141142143144
D N I A Y M K K Q M Q S M G L A I D W S R E V T
D N I A Y M K K Q M Q S M . . . . D - - R E V T
GACAACATCGCGTACATGAAGAAGCAGATGCAGTCGATG------------GAC------CGCGAGGTCACG
145146147148149150151152153154155156157158159160161162163164165166167168
T C K P D Y Y K W N Q W L F L K M L E K G I A Y
T C K - - - - - - - - - - - - - - - - - - - - -
ACCTGCAAG---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K K T G T V N W D P V D Q T V L A N E Q V I D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R G W R S G A L V E K R E I P M Y Y M R I T Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A D E L L N D L D G L G W P E R V K I M Q Q N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I G K S F G V N F G F P Y E L D G E K K L L R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F T T R A D T I M G V T F C A I A A E H P L A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R L A Q D K P E L Q A F I D E C K R G G V A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D I A T M E K K G V A T G F S V S H P L T G A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V E V W I G N Y V L M S Y G E G A V M G V P A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D E R D F A F A K K Y G L P I R Q V I A V E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T Y S T D A W Q E W Y G D K T R A V C V N S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y D G L A Y D A A V D A I A A D L K A G G F G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K Q I T Y R L R D W G I S R Q R Y W G T P I P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I H C P S C G D V P V P E Q D L P V V L P E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V P D G T G N P L A K S D A F L N C A C P K C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A A A K R E T D T M D T F V D S A W Y F S R Y A
- - - - - - - - - - D T F V D S A W Y F S - - -
------------------------------GACACGTTCGTCGATTCCGCGTGGTACTTCTCG---------
529530531532533534535536537538539540541542543544545546547548549550551552
A P D A Q T M V D A R T D Y W M P M D Q Y I G G
- - - - - - - - - - - - - - - - - - - Q Y I G G
---------------------------------------------------------CAGTACATCGGCGGC
553554555556557558559560561562563564565566567568569570571572573574575576
I E H A I L H L L Y S R F W A K V M R D L G L V
I E H A I L . L L Y S R F W A K V M - - - - - -
ATCGAGCACGCGATCCTG---CTGCTGTACTCGCGCTTCTGGGCGAAGGTGATG------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A F G E P A K N L L T Q G M V L N E T F Y R E D
- - - - - A . N L L T Q - - - - - - - - - - - -
---------------GCG---AACCTGCTCACGCAG------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A A G K K T W Y N P A D V T V S F D D K G R P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G A V L K A D G Q P V V L G G I E K M S K S K N
- - - - - - - - - - - - - - - - - K M S K S - -
---------------------------------------------------AAGATGTCGAAGTCG------
649650651652653654655656657658659660661662663664665666667668669670671672
N G V D P Q M L I D H Y G A D T A R L F T M F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A P P E Q Q L E W S G A G V D G A S R F L R R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
W A F G F A N R E A L A V R A P F D V A Q L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A D K T L R R E I H G V L K Q A D F D Y Q R L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y N T V V S A A M K M L N A I E G A K G A T P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V L R E T Y G V L L R V L Y P V V P H V T Y E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W K A L G Y A D E F G P L L D A P W P K V D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A L E Q A E I E L V L Q I N G K V R G A L K V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K D A S R E A I E A A A V A D E M F A K F A E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882
K P A K K I I V V P G R L V N V V V
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_leu_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S H Y D F K A I E Q K W Q Q Y W K N N Q I F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T T I E P S K P K Y Y I L D M F P Y P S G E G L
- - - - - - - - - - Y I L D . F P Y P S G E . L
------------------------------TATATTTTAGAT---TTCCCTTACCCTTCTGGTGAG---CTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H V G H P L G Y I A S D I V A R Y K R S K G Y Q
H V G H P L G Y I A S D I V A R Y - - - - - - -
CATGTAGGCCACCCACTGGGCTATATTGCCTCGGATATTGTGGCTAGGTAT---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L H P M G F D A F G L P A E Q F A I Q T G Q H
- L H P M G F D A F G - - - - - - - - - - - - -
---CTTCATCCAATGGGGTTTGATGCATTCGGT---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P A I T T A K N I G R Y K Q Q L C Q L G L S Y D
- - - - - A K N I G R Y K Q Q L C Q L . . . . D
---------------GCTAAAAATATAGGGCGCTATAAGCAACAGCTTTGCCAGTTA------------GAC
121122123124125126127128129130131132133134135136137138139140141142143144
W D R C I S T C E P A Y Y K W T Q W I F I Q L F
- - R C I S T C E - - - - - - - - - - - - - - -
------AGATGCATTAGCACATGCGAG---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N S W Y D I S L Q K A R P I D E L I T L F D Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G N Q Q V Q A S C D K E V S L F T A K E W Q A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D E E S K Q Q H L L A Y R L A F L E D T T V N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
C P E L G T V L A N E E V K D G L S E R G G Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V I R K Q M K Q W S L R I T A Y T D R L L A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H L K W P L S T K E M Q R N W I G R S I G A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L N F T V I A N G Q E H T I P V F T T R P D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F G V T Y L A L S P E H P L A K L I S T G T Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A A I D T Y I T Q A T N R S E R D R L A D V N H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V T G M F T G A Y A I H P F T K Q P L P I W I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y V L A G Y G T G A V M G V P A H D S R D Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F A Q H F Q L P I I Q V V A G G D T A Q S A Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R E G S L F N S Q F L N G L S I Q E A T K Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I Q K L E S L G I G K Q K T T Y R L R N A I F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R Q R Y W G E P I P I Y Y K N N I P Y P I P A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L P L E L P S L A S F K P T P T G E P P L G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A P N W K T K E G Y P I E L S T M P G W A G S S
- - - - - - - - - - - - - - - - - P G W A G S S
---------------------------------------------------CCAGGATGGGCAGGATCTAGT
553554555556557558559560561562563564565566567568569570571572573574575576
W Y F F R Y M D P N N E A S F V G S T A Q N Y W
W Y F F - - - - - - - - - - - - - - - - - - - -
TGGTATTTTTTT------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Q A V D L Y L G G A E H A T G H L L Y A R F W T
- - - - L Y L G G A E H A T G . L L Y A R F W T
------------TTATATTTGGGTGGAGCAGAACACGCTACAGGC---TTACTTTATGCGCGATTTTGGACT
601602603604605606607608609610611612613614615616617618619620621622623624
Q F L Y D L G Y V N I E E P F Q E L I H Q G M I
Q F L - - - - - - - - - - - F . E L I H Q - - -
CAATTTTTA---------------------------------TTT---GAGCTTATTCACCAA---------
625626627628629630631632633634635636637638639640641642643644645646647648
Q G K S S F V Y R I K G T N Q F V S Y N L R H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y E T T A M H V D I H L V K N N I L D L E R F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
N W R P D L Q T A T F V L E N G Q Y I C G S E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E K M S K S K Y N T V N P D T V V E Q Y G A D T
- K M S K S - - - - - - - - - - - - - - - - - -
---AAGATGTCTAAATCA------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L R L Y T M F L G P I E Q A K P W D M H G I E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V F R F L V K V W R L F Y L E K G A I I T N E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P T K E V Q K A I H K A I K K V E E D I K R Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F N T A V S N L M I C V N E L T A L K C N N R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A L T N L V L I L A P F A P H L A E E L W E I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G H Q H S I A Q A P F P T Y E E I Y L Q E E T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E Y P I A I N G K V R A K I N F P V D M P Q G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I E E Q V L T H E S I Q K W I Q G Q Q I K R V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923
V I S S K M V N I V I
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_leu_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D V K T D K N H I E R Y D P A A I E A K W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K W A A D Q I Y R T P P I D P A K P K Y Y V L
- - - - - - - - - - - - - - - - - - - - - Y V L
---------------------------------------------------------------TACGTACTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D F Y P Y P S G D G L S V G H C R N Y V P T D V
D . Y P Y P S G D . L S V G H C R N Y V P T D V
GAT---TACCCCTATCCCAGCGGTGAT---CTAAGTGTGGGACACTGTCGCAACTATGTACCCACCGATGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V A R Y Y R M R G Y N V L H P M G W D A F G L P
V A R Y - - - - - - - - L H P M G W D A F G - -
GTCGCCCGCTAC------------------------CTCCATCCAATGGGATGGGACGCCTTCGGT------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T E N A A I K T K T N P A V L T R R Y S A N Y K
- - - - - - - - - - - - - - - - R R Y S A N Y K
------------------------------------------------CGCCGTTACAGCGCCAATTACAAG
121122123124125126127128129130131132133134135136137138139140141142143144
R Q M N M L G L S Y D W D R E I T S S E P D Y Y
R Q M N M L . . . . D - - R E I T S S E - - - -
CGCCAGATGAACATGCTT------------GAC------CGCGAAATTACCTCGTCTGAA------------
145146147148149150151152153154155156157158159160161162163164165166167168
H W T Q W I F L R L Y Q S W Y D R R V D K A R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I S E L E A E L A E Y G T S R L D L P L T E P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V T A E D W R N A T P L Q R Q E I L R R F R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y R G E A V V N W D P V D K T V L A N E E V L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D G T A W R S G A K V E R R V L K Q W F F R I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A Y A D R L D R D L D T V D W P S K I V T M Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N W I G R S R G A E V I F H T E G G D P I I V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T T R P D T L W G A T F M V L S P E H P L V A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V T T E A Q R A Q V E A Y V E Q A R Q R P T T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A V A E E K E K T G V W T G G Y A I N P V N G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I P I W I A D Y V L M G Y G T G A I M A V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
H D E R D F A F A L K Y N L P I I P V I T R P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N A S R S L L R T E T I A A D T A D V L R A A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F T V T A Q D D G N L L V E L S G D R A H E Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T I V Q P R L C N G W T E V A G S G W L F I F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D A V I E L D S T A A D E Q I T A R L R A A T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N V T L P S A M A Y L H S I P A Y R D I I Y H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E L G T P I H S G P I N G I A A E E A I E R T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T Y L E Q Q G I G K G R T N Y K M R D W L I S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q R Y W G T P I P I I H R E D G L E I A L S D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E L P L T L P N V E S Y E P T A T G E S P L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I D D W V N V T L P D G S R G R R E T D T M G T
- - - - - - - - - - - - - - - - - - - - - - G T
------------------------------------------------------------------GGAACG
673674675676677678679680681682683684685686687688689690691692693694695696
F A C S S W Y F L R F A D N H N D K A L A S P E
F A C S S W Y F L - - - - - - - - - - - - - - -
TTTGCCTGTTCATCGTGGTACTTCCTG---------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A L D Y W L P V D M Y V G G A E H A V M H L L Y
- - - - - - - - - M Y V G G A E H A V M . L L Y
---------------------------ATGTACGTCGGTGGAGCCGAACACGCCGTCATG---CTACTCTAC
721722723724725726727728729730731732733734735736737738739740741742743744
A R F W T K V L Y D L G V V K F F E P F T C L R
A R F W T K V L - - - - - - - - - - - F . C L R
GCCCGTTTCTGGACGAAGGTGCTT---------------------------------TTC---TGCCTGCGC
745746747748749750751752753754755756757758759760761762763764765766767768
N Q G L I L A P A R E V N G Q I I I E K M S K S
N Q - - - - - - - - - - - - - - - - - K M S K S
AATCAA---------------------------------------------------AAGATGTCGAAGTCG
769770771772773774775776777778779780781782783784785786787788789790791792
K G N V I T P D E V V A E H G A D A L R G Y E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F I S D F E L S V P W N T D G V P G V K R W L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R V W R I V L Y P T A E R G Q S T T P M S E R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L R R I A H Q T I Q R V E H D I L N F K F N T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V A A L M E F T N A L Y R A R D A G L A G T P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
W Q E A I E L L L L L M A P I T P H I A E E L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A R L G K P Y S I H Q Q R W P V A D P A I A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E E V E I V I Q V N G K V R G K L T V P V E I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
E A Q L R E L A L N N E R V Q Q F I N G K Q I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999
S V I V V P G R L V N V V V G
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_leu_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A Y E A S L I E K K W Q K I W D E N E Y F E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K D D L N L P K K Y I L S M F P Y P S G R I H M
- - - - - - - - - Y I L S . F P Y P S G R I H M
---------------------------TAAAATTTCTTC---GCTCGCACTACTTGAAATTTCAAATTCAGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H V R N Y T I G D A L A R Y Y R K I G F N V L
G H V R N Y T I G D A L A R Y - - - - - - - - L
CCTTTTTTTACCATTAATACTTACAGCTAAATTTAAAGTATCTTT------------------------TAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H P I G F D S F G M P A E N A A I K H K I H P K
H P I G F D S F G - - - - - - - - - - - - - - -
TTTTTTGAAATTTTTACATTTAAAAAG---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S W T Y E N I A Y M K K E L F S L G F S F S K K
- - - Y E N I A Y M K K E L F S L . . S - - - -
---------AATAATATAAAAAGCCTCTTGCTCCAAAGCTTCATTTTTACA------TAA------------
121122123124125126127128129130131132133134135136137138139140141142143144
R M L A T S D P L Y T K F E Q E F F I K M F E K
R M L A T S D - - - - - - - - - - - - - - - - -
TTCCATACAAGCTGCAATTAA---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G L I Y T K E A N V N W C E Q D Q T V L A N E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V E D G K C W R C G H E V V Q K K M P G Y Y V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I T A Y A E E L L K D L E E L K D K W P N Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T M Q E N W I G K S E G L E F S L N L D E E S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q K T K E S S L E V F T T R A D T I Y G V S Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A L A P E H K I V Q N L L S Q N L L N Q D V L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K I K V I Q N Q S P R E R Q S S E K E G Y F L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I Y A I H P L S G E K I P L W V A N F V L A D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G S G A V M A V P A H D E R D F E F A T K Y N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A I K Q V I Q T Q E N L P Y M Q K L G K L I N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q E F D N L D C N E A R L K I I S Q F E A K N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G K R V V N F K I R D W G V S R Q R Y W G A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P M I K C Q S C G I V P Q K L E N L P I T L P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D V Q I T G E G N P L D K H P T W K N C I C P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C G K E A Q K E S D T L D T F F E S S W Y F A R
- - - - - - - - - - - - D T F F E S S W Y F A -
------------------------------------AGGATGAATGGCATAAATTCCTAAAAAATAACC---
505506507508509510511512513514515516517518519520521522523524525526527528
F A S D E K T W Q E K A L D E K S V K Y W M S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D Q Y I G G I E H A I L H L L Y A R F F Q K A L
- Q Y I G G I E H A I L . L L Y A R F F Q K A L
---TAAATTTTGTGAAAGCAAATTTTGAACAATCTT---TTCTGGAGCTAAAGCGATATACGAAACTCCATA
553554555556557558559560561562563564565566567568569570571572573574575576
R D L G Y L T Q N E P F D R L L T Q G M V L K D
- - - - - - - - - - - F . R L L T Q - - - - - -
---------------------------------AGA---TTCTTTGGTTTTTTG------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G A K M S K S K G N V V D P D E I I E K Y G A D
- - K M S K S - - - - - - - - - - - - - - - - -
------AGAAAATTCCAAACC---------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T A R L F I L F A A P P A K E L E W N D D A V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G A Y R F I C K L Y D R A Q N V K K G E L V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K Q E N L N K E E K Y A R L K V Y E A L K K S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E V Y H Q S F A F N T L I A A C M E A L N A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L C K N E A L E Q E A F Y I I L N I L E P I I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
H V C F E L S E E L F K C K N F K K L E L K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V F V K D T L N L A V S I N G K K R A E F E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S S A S K E E I L A F A K E N T A K W L E G K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809
I V K E I Y V E G K L V N L V I K
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_leu_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E S R Y N P A A I E E K W Q K T W V E Q G I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K T E E N Q D K P K F Y A L S M F P Y P S G S L
- - - - - - - - - - - Y A L S . F P Y P S G S L
---------------------------------TTCTTGCATTTG---ATCGGCTTGAGCGGGAACTTGAAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H M G H V R N Y V I T D V I A R L K R M Q G Y R
H M G H V R N Y V I T D V I A R L - - - - - - -
TGTGCCTCTAGTTTTACCATTAATCTGAATTACTAATGTCATTTCATCTGC---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L H P M G W D A F G L P A E N A A I K N N I P
- L H P M G W D A F G - - - - - - - - - - - - -
---CAACCACGACTGTTTGTGAACCGATTCCTG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P A K W T Q R N I A Q M R D Q L K R L G L S I D
- - - - - Q R N I A Q M R D Q L K R L . . . . D
---------------CAAGAGAATTAATGTTTTAATTCCTTCCGCATACACTGGAGA------------TGC
121122123124125126127128129130131132133134135136137138139140141142143144
W D K E L A T C S P D Y Y K W T Q W I F L Q F L
- - K E L A T C S - - - - - - - - - - - - - - -
------CAGGGCATTACTGAGTTTCAT---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q A G L A Y Q K E A A V N W D P V D Q T V L A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E Q V D S E G R S W R S G A K V E K K L L K Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F L K I T D Y A E E L L Q D L D Q L I G W P E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K L M Q A N W I G K S T G A Y L E F P I V G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S E K I G V F T T R P D T V Y G V T Y V V L A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H P L T R Q V T T P D R K A A V E A F I Q E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A A E S E L E R T A E D K P K R G I P T G G M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I N P F T G A E I P I W I A D Y V L Y E Y G T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V M G V P A H D T R D F Q F A Q G N N L P I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V I V P P N N D V E M L R V T P L Q E A Y T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P G I M V N S G S F D G T D S V K G K Q A V I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y A E K Q G W G K A R I Q Y R L R D W L I S R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R Y W G A P I P V V H C P N C G I V P V P E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L P V R L P E D I E F T G R G G S P L A Q L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
W V N V P C P T C G T P A K R E T D T M D T F I
- - - - - - - - - - - - - - - - - - - - D T F I
------------------------------------------------------------TACATCATTGTT
505506507508509510511512513514515516517518519520521522523524525526527528
D S S W Y F L R F P D A T N D K L V F D S A R V
D S S W Y F L - - - - - - - - - - - - - - - - -
GGGTGGCACAATGACAACCTG---------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N D W M P V D Q Y V G G I E H A I L H L L Y S R
- - - - - - - Q Y V G G I E H A I L . L L Y S R
---------------------AGTACCGTATTCATACAATACGTAGTCAGCAAT---AATCGGAATTTCTGC
553554555556557558559560561562563564565566567568569570571572573574575576
F F T K V L R D R P K G G T E G D R N L L N F D
F F T K V L - - - - - - - - - - - - - - - - - -
ACCTGTAAACGGGTTAAT------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E P F Q R L L T Q G M V Q G L T Y M N P N K A D
- - F . R L L T Q - - - - - - - - - - - - - - -
------GCT---GGCTGCAACCTCTTG---------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K D K W V P T S I V N A D D P R D P Q T G E P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K L V Y A T M S K S K G N G V A P E E V I A K Y
- - - - - T M S K S - - - - - - - - - - - - - -
---------------CGAACTACCAACTAT------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G V D T A R M F I L F K A P P E K D L E W D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D V Q G Q F R F L N R V W Q L V T E F A Q Q P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V K E T S I K N P K S K I E K D L R R A I H T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I Q A I T E D L E G E Y Q F N T A V S E L M K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S N A L A D A T C K D S P V Y A E G I K T L I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L L A P F A P H I A D E L W H A I A N Q E S V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K Q S W L K A D P D A L V A D E M T L V I Q I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G K T R G T I Q V P A Q A D R Q M Q E K L A R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S E P A Q R Y V E G K E I K K V I V V P G K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869
N F A I G
- - - - -
---------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_leu_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R K V P G C V C A G A I F L L M V E R P A P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A T A T A L V P S P I S E A E P S P I N L Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S H L M T Q E A T K P N I Q E P R A E R Y N P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I E Q K W Q G Q W Q E S G L Y K F D E N A P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K F Y A L T M F P Y P S G N L H I G H W Y A N
- - - Y A L T . F P Y P S G N L H I G H W Y A N
---------TACGCCCTGACG---TTCCCGTACCCCTCGGGCAACCTGCACATCGGCCACTGGTACGCCAAC
121122123124125126127128129130131132133134135136137138139140141142143144
V A P D A R A R W L R M R G Y N V L F P M A F D
V A P D A R A R W - - - - - - - - L F P M A F D
GTGGCCCCCGACGCCCGCGCGCGCTGG------------------------CTGTTTCCGATGGCTTTCGAC
145146147148149150151152153154155156157158159160161162163164165166167168
A F G L P A E N A A I K N N T N P A T W T Y A N
A F G - - - - - - - - - - - - - - - - - - Y A N
GCCTTCGGG------------------------------------------------------TACGCCAAC
169170171172173174175176177178179180181182183184185186187188189190191192
I E R M T G Q F S R M G T M I D W S R K F A T C
I E R M T G Q F S R M . . . . D - - R K F A T C
ATCGAGCGCATGACCGGGCAGTTCTCGCGCATG------------GAC------CGCAAGTTCGCCACCTGC
193194195196197198199200201202203204205206207208209210211212213214215216
D P E Y Y R W N Q W F F I E F W K R G L A Y K K
D - - - - - - - - - - - - - - - - - - - - - - -
GAC---------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G G L V N W C P K D Q T V L A N E Q V V N G H C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E R C G T A V E R R N L S Q W Y L K I T D Y A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L L D F S A T D M P E K V R A M Q T N W I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S V G A E V T F D T P A G P E T V F T T R P D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L M G A T F M V L A P E H A K V K E L T T D E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R A E V E A Y V A A A G R K T D V E R Q Q E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K T G V F T G S Y A T H P I S G H Q L P I W V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y V L V T Y G T G S I M A V P A H D E R D F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F A K K F D L P I R E V I R A E G S E G M G D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P S E P Y S G E G Q I V N S G E F D G M P G G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A S I A A I I A R L E E R G V A K A K T T Y R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R D W L F A R Q R Y W G T P I P F V H C E K C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
M Q P V P E D Q L P V K L P E N V A F T P T G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S P L K L D E E W K T T T C P C C G G P A E R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T D T M D T F V D S S W Y M Y R Y L S P N Y D G
- - - - D T F V D S S W Y M Y - - - - - - - - -
------------GACACCTTCGTGGACTCGAGCTGGTACATGTAC---------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G P F D P S K A G L L P V D L Y T G G I E H A I
- - - - - - - - - - - - - - L Y T G G I E H A I
------------------------------------------CTGTACACGGGCGGCATCGAGCACGCCATT
601602603604605606607608609610611612613614615616617618619620621622623624
L H L L Y S R F W T K V M R D M G L T T Q S E P
L . L L Y S R F W T K V M - - - - - - - - - - -
TTG---CTGCTGTACTCGCGCTTCTGGACCAAAGTGATG---------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F A R L R N Q G M V L G E D G E K M S K S R G N
F . R L R N Q - - - - - - - - - K M S K S - - -
TTT---CGGCTGCGCAACCAG---------------------------AAGATGTCCAAGTCG---------
649650651652653654655656657658659660661662663664665666667668669670671672
V V D P D D L V R E Y G A D T V R A F L M F I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
P W E L G G P W D P Q G I N G P S K W L S R V W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N V F F E E K V S G P E E K M Q G A D V R F A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
H S A L K K V N D D F E R M S F N T I I S T L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E L T N A L V K A K R S P V F G T P V W E E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D I F N R M L A P V V P H I A E E I W H E R G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K G S V H T A Q W P Q V D E A A A V R D T V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G V Q V S G K V R G E V S I S K T A S Q E E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S A A R A I A E V Q K H L E G K T V V K E I Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874
P G R I I N I V A K
- - - - - - - - - -
------------------------------
Class I
Bacteria/Escherichia coli/amino acid sequences/Ecoli_leu_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N N P G I I S T S S A R K A V L T R A F G L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y A D L K N H I N A T F V A V L K T G P L A A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q E Q Y R P E E I E S K V Q L H W D E K R T F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V T E D E S K E K Y Y C L S M L P Y P S G R L H
- - - - - - - - - - Y C L S . L P Y P S G R L H
------------------------------TTCGCCTTTCAG---CTGCCACAGCGTGAAGCAGATGTGCGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M G H V R N Y T I G D V I A R Y Q R M L G K N V
M G H V R N Y T I G D V I A R Y - - - - - - - -
GGTGAACGGGTTAAGCATACGGACTACCGCCAGCAGCGCTTCCTGCAT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L Q P I G W D A F G L P A E G A A V K N N T A P
L Q P I G W D A F G - - - - - - - - - - - - - -
GGTCGGTGCTTTCGCCAGTTTGTTCATCAG------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A P W T Y D N I A Y M K N Q L K M L G F G Y D W
- - - - Y D N I A Y M K N Q L K M L . . . . D -
------------GGTTACTTTAGCGATAGTTTTATGCACATCGCGACGCAGCGC------------AGT---
169170171172173174175176177178179180181182183184185186187188189190191192
S R E L A T C T P E Y Y R W E Q K F F T E L Y K
- R E L A T C T - - - - - - - - - - - - - - - -
---ATCGACGTTCAGTGCCGCAAC------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K G L V Y K K T S A V N W C P N D Q T V L A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q V I D G C C W R C D T K V E R K E I P Q W F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I T A Y A D E L L N D L D K L D H W P D T V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T M Q R N W I G R S E G V E I T F N V N D Y D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T L T V Y T T R P D T F M G C T Y L A V A A G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P L A Q K A A E N N P E L A A F I D E C R N T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V A E A E M A T M E K K G V D T G F K A V H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T G E E I P V W A A N F V L M E Y G T G A V M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V P G H D Q R D Y E F A S K Y G L N I K P V I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A A D G S E P D L S Q Q A L T E K G V L F N S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E F N G L D H E A A F N A I A D K L T A M G V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E R K V N Y R L R D W G V S R Q R Y W G A P I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M V T L E D G T V M P T P D D Q L P V I L P E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V V M D G I T S P I K A D P E W A K T T V N G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P A L R E T D T F D T F M E S S W Y Y A R Y T C
- - - - - - - - - D T F M E S S W Y Y A - - - -
---------------------------GTTTGCTGCCCAAACGGGAATTTCTTCGCCCGT------------
553554555556557558559560561562563564565566567568569570571572573574575576
P E Y K E G M L D S K A A N Y W L P V D I Y I G
- - - - - - - - - - - - - - - - - - - - I Y I G
------------------------------------------------------------TTTGGTGTTACG
577578579580581582583584585586587588589590591592593594595596597598599600
G I E H A I M H L L Y F R F F H K L M R D A G M
G I E H A I M . L L Y F R F F H K L M - - - - -
GCATTCGTCAATAAAGGCGGC---TTCAGGATTATTTTCCGCCGCTTTCTGTGCCAG---------------
601602603604605606607608609610611612613614615616617618619620621622623624
V N S D E P A K Q L L C Q G M V L A D A F Y Y V
- - - - - - A . Q L L C Q - - - - - - - - - - -
------------------ACC---AAAGGTGTCCGGGCG---------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G E N G E R N W V S P V D A I V E R D E K G R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V K A K D A A G H E L V Y T G M S K M S K S K N
- - - - - - - - - - - - - - - - - K M S K S - -
---------------------------------------------------AGTGATTTTGATAAA------
673674675676677678679680681682683684685686687688689690691692693694695696
N G I D P Q V M V E R Y G A D T V R L F M M F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S P A D M T L E W Q E S G V E G A N R F L K R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
W K L V Y E H T A K G D V A A L N V D A L T E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Q K A L R R D V H K T I A K V T D D I G R R Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F N T A I A A I M E L M N K L A K A P T D G E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D R A L M Q E A L L A V V R M L N P F T P H I C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
F T L W Q E L K G E G D I D N A P W P V A D E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A M V E D S T L V V V Q V N G K V R A K I T V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V D A T E E Q V R E R A G Q E H L V A K Y L D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907
V T V R K V I Y V P G K L L N L V V G
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_leu_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P S Y N H A D V E R R W Q Q F W E T N K T F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T A D P G E P G T E G K P K Y Y I L D M F P Y P
- - - - - - - - - - - - - - - Y I L D . F P Y P
---------------------------------------------GTCGTCGATCTC---GGGCACCTTCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G A G L H V G H P E G Y T A T D I L A R F K R
S G . G L H V G H P E G Y T A T D I L A R F - -
CACGGC---CTTCTTGCCGTTGATCTGAACCGGCACCTCGATCTCGTCGGCCTTCGCCAGCGCGGG------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M N N F H V L H P M G W D A Y G L P A E Q Y A V
- - - - - - L H P M G W D A Y G - - - - - - - -
------------------GGCGAGCGTGTCCGTGTGCCCCAGGGCGCG------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K N V H P R I T T Q Q N I N T F R R Q I K A L
- - - - - - - - - - Q Q N I N T F R R Q I K A L
------------------------------TTCCAGCACCGCGCGGGGTCGCGCCTCCAGCTTGGTGGCGTG
121122123124125126127128129130131132133134135136137138139140141142143144
G F S Y D W D R E V D T T D P N Y F K W T Q W I
. . . . D - - R E V D T T D - - - - - - - - - -
------------CAT------GGAGATCGCGGTGTTGAAGCG------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F L T I Y D T W Y D P V A R K G R P I A E L P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P A E V T G Q G P D A V R K Y Q D D H R L A Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A E V P V N W C P A L G T V L A N E E V I D G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S E R G G H P V E R R P L R Q W L M R I T A Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E R L L E D L E P L D W S H S I K E M Q R N W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G K S E G A E V E F K L A D H D A T V R V F T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R P D T L Y G A T Y M V L S P E H P L V P A I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T P S H A A A V K E Y Q Q A A A R K S D F E R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E T A K K K T G V F T G A Y A I N P L G N E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P I W I A D Y V L A T Y G T G A I M A V P G H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E R D F E F A K E F G L P I V T V V R P T D E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A K T G S T V S D L K E P Y C E E G I A I N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G R L N G L P T A E A K R D V I V T L E G R G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G H R R V N Y K L R D W L F S R Q R Y W G E P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P V L H G A G G E L V A L S P G D L P L V P P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L E D F K P T G T P E G P L S K A T D W V N V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A G G K G F K R E T N T M P Q W A G S C W Y F L
- - - - - - - - - - - - - P Q W A G S C W Y F L
---------------------------------------CGGCACGGCCATGATCGCGCCGGTTCCGTAGGT
553554555556557558559560561562563564565566567568569570571572573574575576
R Y I D P Q N T G A F A D P A K L K H W L P I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L Y V G G A E H A V L H L L Y A R F W H K V L F
L Y V G G A E H A V L . L L Y A R F W H K V L -
GAACACGCCGGTCTTCTTCTTGGCGGTCTCGGT---CTCGAAGTCGCTCTTCCGCGCCGCCGCCTGCTG---
601602603604605606607608609610611612613614615616617618619620621622623624
D R G Y L P C P E P F Q R L V N Q G M I L G E V
- - - - - - - - - - F . R L V N Q - - - - - - -
------------------------------GGT---CGCCGGCACCAGCGG---------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E L T A Y Q K G G K W V S A N A V T D E E K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A E I K Q G P V Q T V S V T E E Q V E K K G P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F V L K E D N S I R V D S R A H K M S K S R G N
- - - - - - - - - - - - - - - - K M S K S - - -
------------------------------------------------CATCAGCCACTGGCG---------
697698699700701702703704705706707708709710711712713714715716717718719720
V V N P D D I V K E Y G A D S L R L Y E M F M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
P L E A V K P W N T K S V E G V Y R F L S R A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R L I V D D M A E S L T L N P A V K D V E P D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D T L R V L H R T I Q K V G E D T E G L R F N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A I S A M M E F V N H A T K L E A R P R A V L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P F V L L L A P Y A P H V A E E L W R A L G H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
D T L A Y A P W P K F D P A L A K A D E I E V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V Q I N G K K K A V L K V P A E I D D A A L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A A R A D E A V K A A I D G K T V K M V K V V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921
R K L V N I V V V
- - - - - - - - -
---------------------------
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_leu_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F N H R E I E Q K W Q D Y W E K N K T F R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P D D D D K P K F Y V L D M F P Y P S G A G L H
- - - - - - - - - Y V L D . F P Y P S G . G L H
---------------------------CCGCTCCTCGAG---TTCTTTTGGCAAGTCGGC---CACGTGCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H P E G Y T A T D I L A R M K R M Q G Y N V
V G H P E G Y T A T D I L A R M - - - - - - - -
GCGCGACCGCACTTTGCCGTTGATTTGCACGACGATTTCGACGACGTC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L H P M G W D A F G L P A E Q Y A L D T G N D P
L H P M G W D A F G - - - - - - - - - - - - - -
CGCCGGCCACGGTTCGTAGGCGATCGTGTC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E F T Q K N I D N F R R Q I K S L G F S Y D W
- - - - Q K N I D N F R R Q I K S L . . . . D -
------------CAAGAGCTTGACGAAGCCTTCCATGTATTCTTTTTTCATTTG------------CGC---
121122123124125126127128129130131132133134135136137138139140141142143144
D R E I N T T D P N Y Y K W T Q W I F L K L Y E
- R E I N T T D - - - - - - - - - - - - - - - -
---GATAAACACCATCAGCTGCGA------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K G L A Y M D E M P V N W C P A L G T V L A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E V I N G R S E R G G H P V I R K P M R Q W V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I T A Y A D R L L E D L E E L D W P E S I K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M Q R N W I G R S E G A E I E F A V D G H D E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F T V F T T R P D T L F G A T Y T V L A P E H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L V E K I T T P E Q K P A V D A Y L K E I Q S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D L E R T D L A K E K T G V F T G A Y A I H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V T G D R L P I W I A D Y V L M S Y G T G A I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V P A H D E R D Y E F A K T F H L P I K E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A G G N I E K E A Y T G D G E H I N S E F L N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N K Q E A I D K M I A W L E E H G K G R K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S Y R L R D W L F S R Q R Y W G E P I P I I H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D G T M T P V P E E E L P L V L P K T D E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P S G T G E S P L A N I E E W V N V V D P K T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K G R R E T N T M P Q W A G S C W Y Y L R Y I
- - - - - - - - - - P Q W A G S C W Y Y L - - -
------------------------------ATCGCCGGTGACCGGGTGAATGGCGTACGCGCC---------
505506507508509510511512513514515516517518519520521522523524525526527528
D P H N D K Q L A D P E K L K K W L P V D V Y I
- - - - - - - - - - - - - - - - - - - - - V Y I
---------------------------------------------------------------GTAGGCGTC
529530531532533534535536537538539540541542543544545546547548549550551552
G G A E H A V L H L L Y A R F W H K F L Y D L G
G G A E H A V L . L L Y A R F W H K F L - - - -
AACGGCTGGCTTTTGCTCCGGCGT---GATTTTTTCCACGAGCGGATGCTCCGGCGCCAA------------
553554555556557558559560561562563564565566567568569570571572573574575576
V V P T K E P F Q K L F N Q G M I L G E N N E K
- - - - - - - F . K L F N Q - - - - - - - - - K
---------------------CCG---CGTGAAGACGGTGAA---------------------------CTC
577578579580581582583584585586587588589590591592593594595596597598599600
M S K S K G N V V N P D D I V E S H G A D T L R
M S K S - - - - - - - - - - - - - - - - - - - -
GATTTCCGCTCC------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L Y E M F M G P L E A S I A W S T K G L D G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R F L D R V W R L F V T E N G E L N P N I V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
P A N D T L E R V Y H Q T V K K V T E D Y E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R F N T A I S Q L M V F I N E A Y K A E Q M K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E Y M E G F V K L L S P V C P H I G E E L W Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L G H T D T I A Y E P W P A Y D E T K L V D D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V E I V V Q I N G K V R S R L H V P A D L P K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A L E E R A L A D E K I K E Q L E G K T V R K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805
I A V P G K L V N I V A N
- - - - - - - - - - - - -
---------------------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_leu_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y N H N E I E K K W Q T R W E K T K A F K T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N K S K D K F Y A L D M F P Y P S G S G L H V G
- - - - - - - Y A L D . F P Y P S G . G L H V G
---------------------AGCTTCTTCAAT---TCTTTTTTCATCTCAATC---TTCTATTTCAAAAGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H P E G Y T A T D I I S R Y K R L K G F D V L H
H P E G Y T A T D I I S R Y - - - - - - - - L H
TTCACGTAATTTTCCATTTACTTGAATTGCTACAATATCTTT------------------------ATAAGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P I G W D A F G L P A E Q Y A L S S G K H P Q P
P I G W D A F G - - - - - - - - - - - - - - - -
TGGTCAACTTTGAAACATAATTTC------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F T L K N I E N F R R Q L K S L G F S F D Y E K
- - L K N I E N F R R Q L K S L . . . . D - - K
------AAACATAATTGCAAAATCTTTTAAAGGTTTTAATGAATAAAT------------ATA------ATT
121122123124125126127128129130131132133134135136137138139140141142143144
E V N T T D P S Y Y R W T Q W I F K Q I Y K K G
E V N T T D - - - - - - - - - - - - - - - - - -
AACAAAAATCATTAATTT------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L A E I R E V D V N W C P G L G T V L A N E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V E N D K G E M V S E R G S F P V Y K K P M K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W V L K I T N Y A D R L L E D L N L L D W P D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L K K L Q T N W I G K E E I D G K I T Y K L Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W I F A R Q R Y W G E P F P V Y F D E D N N V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L I D E L V E L P H M E N I M P S G T G E G P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A T N T E W V Q Y K K N N K I F K R D T N T M P
- - - - - - - - - - - - - - - - - - - - - - - P
---------------------------------------------------------------------ATA
313314315316317318319320321322323324325326327328329330331332333334335336
Q W A G S C W Y Y L A Y I M K Q E D G T Y L P I
Q W A G S C W Y Y L - - - - - - - - - - - - - -
TCAACAACTTCCTGCTCATTGAGGCATTGT------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D S K K A Y E A F S K W L P V D L Y I G G Q E H
- - - - - - - - - - - - - - - - L Y I G G Q E H
------------------------------------------------CATAATATTTTCCATATGAGGTAA
361362363364365366367368369370371372373374375376377378379380381382383384
A V L H L L Y A R F W H K I L Y D L K I V P T K
A V L . L L Y A R F W H K I L - - - - - - - - -
TTCAACAAG---ATCAATCAAATAAACATTGTTATCTTCATCAAA---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E P F Q K L I N Q G M I L G K D G Q K M S K S L
- - F . K L I N Q - - - - - - - - - K M S K S -
------TCT---AAAAATTCAATCTTG---------------------------TTCTTCTTTTCCAAT---
409410411412413414415416417418419420421422423424425426427428429430431432
G N V V N P D E I I Q N F G A D T L R V Y E M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
M G P L T D T K K W N E S T V E A T Y K W I L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V K R I F Q I F I E D K S K I N S L H K D D Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I S E H N L L I K E I T Q D I E D L K F N I M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S K L M I F V N S L Y K K E K I Y S L K P L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F A I M F S T I A P H I S E E L L E S L G E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I M F Q S W P T Y E N N K I L L T K D I V A I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V N G K L R E T F E I E N D W D E K R V I E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K K L P N V K K H L E N K I I K K E I Y I A K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630
I L N F I I
- - - - - -
------------------
Class I
Bacteria/Mycobacterium smegmatis/amino acid sequences/Msmegmatis_leu_aa
Bacteria/Mycobacterium smegmatis/nucleotide sequences/Msmegmatis_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E P A T T P T T P D E Q I P R H R Y N A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G Q I E R A W Q E T W S D R G T F N V A N P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G S L A P T D G S D V P A D K M F V Q D M F P Y
- - - - - - - - - - - - - - - - F V Q D . F P Y
------------------------------------------------CACCAGGTACTG---GTCGGCCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P S G D G L H V G H P L G Y I A T D V Y A R Y Y
P S G . G L H V G H P L G Y I A T D V Y A R Y -
GGGGAAAGG---GTGTGCCAGCGAGGTGTCGTGGCCCAGCCGCTTCCACAGTTCCTCGGCGAGGTGCGG---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R M L G R N V L H A L G F D A F G L P A E Q Y A
- - - - - - - L H A L G F D A F G - - - - - - -
---------------------CAGTGGTTCGATCGCGGCGCGCGCCGCCAC---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V Q T G T H P R T R T E A N I V N F R R Q L G R
- - - - - - - - - - - E A N I V N F R R Q L G R
---------------------------------GTTGCGAAGGGCCGCATAGTCTTCGCGCACACCTTCGAT
145146147148149150151152153154155156157158159160161162163164165166167168
L G L G H D T R R S F S T T D V D Y Y K W T Q W
L . . . . D - - R S F S T T D - - - - - - - - -
CGT------------GCG------CTCGTCGCTGAGTGCCTCGTG---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I F L Q I Y N A W F D R D Q N K A R R I S E L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E E F E S G K R T L D D G R N W A D L S K G E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A D V I D G Y R L V Y R A D S M V N W C P G L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T V L A N E E V T S E G R S D R G N F P V F R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R L R Q W M M R I T A Y S D R L L E D L D V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
W P E K V K T M Q R N W I G R S T G A S V L F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T A A D D I E V F T T R P D T L F G A T Y L V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A P E H D L V D T L V T D A W P D G T D E R W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y G A A T P R E A V A A Y R T D I A A K S D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R Q E N K T K T G V F L G A Y A T N P A D G K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V P I F I A D Y V L A G Y G T G A I M A V P G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D Q R D W D F A K E F G L P I I E V V T G G D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S E A A Y A G D G T M V N S G F L D G M D V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A K E A I I A R L E A D G R G K R R V E Y K L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D W L F A R Q R Y W G E P F P I V Y D A D G R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
H P L P E S A L P V E L P D V P D Y S P V L F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P D D A D S E P S P P L N K A T E W V H V E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L G D G L Q S Y T R D T N V M P Q W A G S S W Y
- - - - - - - - - - - - - - - P Q W A G S S W Y
---------------------------------------------CGCGCCGTAGGTCCAGCGCTCGTCGGT
601602603604605606607608609610611612613614615616617618619620621622623624
E L R Y T D P H N P D E M C A K E N E A Y W M G
E L - - - - - - - - - - - - - - - - - - - - - -
GCCGTC------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P R P D E H G P E D P G G V D L Y V G G V E H A
- - - - - - - - - - - - - - - L Y V G G V E H A
---------------------------------------------GGCCGCGGTCGCGAACAGCACCGAGGC
649650651652653654655656657658659660661662663664665666667668669670671672
V L H L L Y S R F W H K V L Y D L G Y V S S R E
V L . L L Y S R F W H K V L - - - - - - - - - -
ACCCGT---GCGGCCGATCCAGTTGCGCTGCATGGTCTTGAC------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
P Y R R L V N Q G Y I Q A F A Y T D S R G T Y V
- Y R . L V N Q - - - - - - - - - - - - - - - -
---GAGGAG---GTCGGAGTACGC------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P A A E V I E R D G K F F W P G P D G E I E V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q E F G K I G K S L K N S V S P D E I C D N Y G
- - - - K I G K S - - - - - - - - - - - - - - -
------------GTCGGCGCGGTACAC---------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A D T L R V Y E M S M G P L E A S R P W A T K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V V G A H R F L Q R V W R V V I D E T S G N V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V V E H E A L S D E T L R L L H R T I E G V R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
D Y A A L R N N T A A A K L I E Y T N H L T K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G V A A R A A I E P L V L M V A P L A P H L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E L W K R L G H D T S L A H G P F P E A D P Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L V E D T I E F P V Q V N G K V R G K I V V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
D A D K A A L E A A A L A D E K V Q A F L A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953
T P K K V I V V P G R L V N L V V
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_leu_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N Y N H N Q I E K K W Q D Y W D E N K T F K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N D N L G Q K K F Y A L D M F P Y P S G A G L H
- - - - - - - - - Y A L D . F P Y P S G . G L H
---------------------------AATTTCTTGCAT---TTCTTTTGATGTATCTTT---AATTTTAAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H P E G Y T A T D I I S R Y K R M Q G Y N V
V G H P E G Y T A T D I I S R Y - - - - - - - -
TTTAGCTCTCAATTTACCATTAACTTGAACAACGATTTCTACTTCATC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L H P M G W D A F G L P A E Q Y A L D T G N D P
L H P M G W D A F G - - - - - - - - - - - - - -
AGTTGGCCAAGGTTGGTACGTAATAGACTC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E F T K K N I Q T F K R Q I K E L G F S Y D W
- - - - K K N I Q T F K R Q I K E L . . . . D -
------------TAACATTTTAACGAAGCCTTCAATGTAAGGTTTATAAACTTC------------ACA---
121122123124125126127128129130131132133134135136137138139140141142143144
D R E V N T T D P E Y Y K W T Q W I F I Q L Y N
- R E V N T T D - - - - - - - - - - - - - - - -
---AATAAATACCATTAATTGACT------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K G L A Y V D E V A V N W C P A L G T V L S N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E V I D G V S E R G G H P V Y R K P M K Q W V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I T E Y A D Q L L A D L D D L D W P E S L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M Q R N W I G R S E G A K V S F D V D N S E G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V E V F T T R P D T I Y G A S F L V L S P E H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L V D S I T T D E Y K D Q V K A Y Q T E A S K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D L E R T D L A K D K S G V F T G A Y A I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L S G E K V Q I W I A D Y V L S T Y G T G A I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V P A H D D R D Y E F A K K F D L P I I E V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G G N V E E A A Y T G E G K H I N S G E L D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E N E A A I T K A I Q L L E K K G A G E K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N Y K L R D W L F S R Q R Y W G E P I P V I H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D G T M T T V P E E E L P L L L P E T D E I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P S G T G E S P L A N I D S F V N V V D E K T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M K G R R E T N T M P Q W A G S C W Y Y L R Y I
- - - - - - - - - - P Q W A G S C W Y Y L - - -
------------------------------ACCAGATAAAGGATTAATTGCATATGCACCAGT---------
505506507508509510511512513514515516517518519520521522523524525526527528
D P K N E N M L A D P E K L K H W L P V D L Y I
- - - - - - - - - - - - - - - - - - - - - L Y I
---------------------------------------------------------------CGCTTTCAC
529530531532533534535536537538539540541542543544545546547548549550551552
G G V E H A V L H L L Y A R F W H K V L Y D L G
G G V E H A V L . L L Y A R F W H K V L - - - -
TTGATCTTTATATTCATCAGTTGT---TGAATCAACCAATGCATGCTCAGGACTTAAGAC------------
553554555556557558559560561562563564565566567568569570571572573574575576
I V P T K E P F Q K L F N Q G M I L G E G N E K
- - - - - - - F . K L F N Q - - - - - - - - - K
---------------------AGT---AAATACTTCTACTTT---------------------------AAC
577578579580581582583584585586587588589590591592593594595596597598599600
M S K S K G N V I N P D D I V Q S H G A D T L R
M S K S - - - - - - - - - - - - - - - - - - - -
TTTGGCACCTTC------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L Y E M F M G P L D A A I A W S E K G L D G S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R F L D R V W R L M V N E D G T L S S K I V T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N N K S L D K V Y N Q T V K K V T E D F E T L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F N T A I S Q L M V F I N E C Y K V D E V Y K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y I E G F V K M L A P I A P H I G E E L W S K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G H E E S I T Y Q P W P T Y D E A L L V D D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E I V V Q V N G K L R A K I K I A K D T S K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
M Q E I A L S N D N V K A S I E G K D I M K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804
A V P Q K L V N I V A K
- - - - - - - - - - - -
------------------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_leu_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q N G A N S R S Q E Y Q G V S V D S R Y D P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I E T K W Q Q S W A A A Q L D R T P E A D D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P K F Y A L S M F P Y P S G N L H M G H V R N Y
- - - Y A L S . F P Y P S G N L H M G H V R N Y
---------GCCCCGCGTTTT---CATAATTTGAATCACCAAAGGAATTTCATCGACGATGAGTGCCGATTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T I T D A I A R V K R R Q G F R V L H P M G W D
T I T D A I A R V - - - - - - - - L H P M G W D
ATCCAAGACGGGCCAGCCTTCAAGGTG------------------------CTGCCAAAGTTCCTCGGCAAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A F G L P A E N A A I D R G V Q P A D W T Y Q N
A F G - - - - - - - - - - - - - - - - - - Y Q N
GTGAGGGGC------------------------------------------------------CCCAGGCAT
121122123124125126127128129130131132133134135136137138139140141142143144
V A Q M R E Q L K Q L G L S Y D W D R E V T T C
V A Q M R E Q L K Q L . . . . D - - R E V T T C
GGGTGCATCGTTAAGTGCATTGGTCAGCTTCAT------------CGC------GAGCTGATAATCTTCTTC
145146147148149150151152153154155156157158159160161162163164165166167168
S P D Y Y R W T Q W L F L Q F F E A G L A Y Q K
S - - - - - - - - - - - - - - - - - - - - - - -
CAG---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E A T V N W D P I D Q T V L A N E Q V D S E G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S W R S G A K V E R R Q L K Q W F L K I T D Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E E L L Q D L D Q L T G W P E R V R L M Q A N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I G K S T G A Y L E F P I V N S S D R V K V F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T R P D T V Y G V S Y V V L A P E H P L V T Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T T P E Q Q T A V A A F A A E V S Q T S E L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T A E D R P K R G V P T G G F V T N P F T G Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V P I W I A D Y V L V E Y G T G A V M G V P A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D S R D F A F A Q R Y G L P V Q P V I Q P T E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A I A E P W P A P F T E A G V M V N S G Q F D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L S S T E A K A K I I A F A E E Q G W G Q A H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q Y R L R D W L I S R Q R Y W G C P I P I V H C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P D C G P V A A A D L P V Q L P D S V Q F S G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G P S P L A Q L E D W V T T T C P S C G K P A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R E T D T M D T F M C S S W Y Y L R Y S D A S N
- - - - - - D T F M C S S W Y Y L - - - - - - -
------------------ACCCATTACGGCACCCGTGCCGTACTCAACCAA---------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P E I A F T K D K V N D W L P V D Q Y V G G I E
- - - - - - - - - - - - - - - - - Q Y V G G I E
---------------------------------------------------GCCGCGTTTGGGGCGATCTTC
553554555556557558559560561562563564565566567568569570571572573574575576
H A I L H L L Y S R F F T K V L R D R G L L S F
H A I L . L L Y S R F F T K V L - - - - - - - -
TGCTGTCCGCTC---TTCGCTGGTTTGGCTGACTTCCGCTGCAAAGGC------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D E P F K R L L T Q G M V Q G L T Y K N P K T G
- - - F . R L L T Q - - - - - - - - - - - - - -
---------CTG---CACCAACGGATGTTC------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K Y V P S D R I S D P S Q P V D P D T G D R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
V F F E K M S K S K Y N G V D P A R V L D R Y G
- - - - K M S K S - - - - - - - - - - - - - - -
------------GGCCTGCATCAAGCG---------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A D T A R M F I L F K A P P E K D L E W D D A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V E G Q F R F L N R V W R L V Q T A S Q V E A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T A A D D K A E K D L R R A V H T A I Q A V T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D L E E D Y Q L N T A I A E L M K L T N A L N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A P M P G S P A Y L E G V Q T L V L L L A P F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
P H I A E E L W Q Q L G G E R S V H L E G W P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L D E S A L I V D E I P L V I Q I M G K T R G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I T V P A S A D R D Q L Q Q L A E N S E I A Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
W L D G Q T I R K V I V V P G K L V N F V I A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865
P
-
---
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_leu_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K E Y R P Q E I E K K W Q E V W E E K K V F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T P Q R S E K P K Y Y A L V M F P Y P S G T L H
- - - - - - - - - - Y A L V . F P Y P S G T L H
------------------------------TATGCCCTCGTG---TTTCCGTATCCCTCTGGAACTCTCCAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G H V K N Y V I G D I V A R Y K R M R G Y N V
V G H V K N Y V I G D I V A R Y - - - - - - - -
GTAGGGCACGTGAAAAACTACGTCATAGGTGACATAGTTGCAAGATAC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L H P F G Y D A F G L P A E N A A I E K G I H P
L H P F G Y D A F G - - - - - - - - - - - - - -
CTTCACCCGTTCGGATACGACGCATTCGGA------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E W T R K N I A T I R Q Q V K K L G I S Y D W
- - - - R K N I A T I R Q Q V K K L . . . . D -
------------AGGAAGAACATTGCCACCATTCGGCAGCAGGTGAAAAAACTC------------GAC---
121122123124125126127128129130131132133134135136137138139140141142143144
S R E I A T C D E E Y Y K W T Q W I F L Q L Y K
- R E I A T C D - - - - - - - - - - - - - - - -
---AGAGAAATAGCGACCTGCGAC------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N G L A Y K K K A A V N W C P K C K T V L A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q V K D G K C E R C G T S V T I R H L E Q W F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I T D Y A E R L L N D L D K L T G W P E H V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T M Q R N W I G K S T G A E I D F P V E G S D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I R V F T T R P D T L W G V T F M A L A P E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P L V E E L V P E E K K E E L Q E F L E R V K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q D R F R R T S V E A E K E G F F L G R Y A I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P V T G E R I P I Y V A N Y I L M E Y G T G A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M G V P A H D Q R D F S F A K K Y G I P I K V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I K P A D K D L D P E K M E E A Y E G E G I M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N S G P F D G T P S S E G I E K V I N W L E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G I G K R S V Q Y K L R D W L I S R Q R Y W G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P I P I I Y C E K C G V V P V P E E D L P V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P K D V E F L P T G Q S P L S F H E G F K K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C P V C G G E A Q R E T D T M D T F V D S S W Y
- - - - - - - - - - - - - - - D T F V D S S W Y
---------------------------------------------GACACTTTCGTTGATTCTTCCTGGTAC
505506507508509510511512513514515516517518519520521522523524525526527528
F L R Y V N P H L E D K P F E P D D V N Y W L P
F L - - - - - - - - - - - - - - - - - - - - - -
TTCCTC------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V D Q Y I G G V E H A V L H L L Y S R F V T K V
- - Q Y I G G V E H A V L . L L Y S R F V T K V
------CAGTACATTGGAGGAGTGGAACACGCCGTACTG---TTGCTGTACTCCAGATTCGTAACCAAGGTA
553554555556557558559560561562563564565566567568569570571572573574575576
L H D L G Y L N F D E P F T N L F T Q G M I Y K
L - - - - - - - - - - - F . N L F T Q - - - - -
CTG---------------------------------TTC---AACCTTTTCACACAG---------------
577578579580581582583584585586587588589590591592593594595596597598599600
D G A K M S K S K G N V V S P D E M I E K Y G A
- - - K M S K S - - - - - - - - - - - - - - - -
---------AAGATGTCCAAGTCG------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D T L R M Y I L F M A P P E K D A E W S D A G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E G V H R F V K R L W N T F Y T V L P F V K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N T E N L V L K N S T E K E L R R K L H S I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K I T E D I E G G F K F N T A I S G L M E L V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H L S Q Y L N S V P Q E E W N R K L L R E I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K L T L A L S P F A P H L A E E F W H D L G N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S L V V Q Q S W P S Y D P K A L E V E E V E I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I Q I N G K V R D K V V V P V D I S E E D L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I V L E R E R V K E Y V D G K P I R K F I Y V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824
G R I V N I V V
- - - - - - - -
------------------------
Class I
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_leu_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K Y N P H A I E A K W Q R F W E E K G F M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K D L P G G R G K Q Y V L V M F P Y P S G D L
- - - - - - - - - - - Y V L V . F P Y P S G D L
---------------------------------GGCCCGCGCCAC---CAGGGGGGCGTCCTTGGGGATGTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H M G H L K N Y T M G D V L A R F R R M Q G Y E
H M G H L K N Y T M G D V L A R F - - - - - - -
GATCGTCCCCCGCACCCGCCCGTTCACCTGGACGGCCACCTCCACCACGTC---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L H P M G W D A F G L P A E N A A L K F G V H
- L H P M G W D A F G - - - - - - - - - - - - -
---CTCGGGCCAGCCCGCCTCAAAGAGGCTATC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P K D W T Y E N I R Q A K E S L R L M G I L Y D
- - - - - Y E N I R Q A K E S L R L M . . . . D
---------------CATCTGCAGGTAGTAGCGAATGGCGGTGCGGTAGACCGGGGT------------CTT
121122123124125126127128129130131132133134135136137138139140141142143144
W D R E V T T C E P E Y Y R W N Q W I F L K M W
- - R E V T T C E - - - - - - - - - - - - - - -
------CTCGTAGAGGGCGTTCAGGAA---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K G L A Y R A K G L V N W C P K C Q T V L A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E Q V V E G R C W R H E D T P V E K R E L E Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y L R I T A Y A E R L L K D L E G L N W P E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K A M Q R A W I G R S E G A E I L F P V E G K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V R I P V F T T R P D T L F G A T F L V L A P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H P L T L E L A A P E K R E E V L A Y V E A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R K T E I E R Q A E G R E K T G V F L G A Y A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N P A T G E R I P I W T A D Y V L F G Y G T G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I M A V P A H D Q R D Y E F A R K F G L P I K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V I E R P G E P L P E P L E R A Y E E P G I M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N S G P F D G T E S E E G K R K V I A W L E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G L G K G R V T Y R L R D W L I S R Q R Y W G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P I P M V H C E A C G V V P V P E E E L P V L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P D L K D V E D I R P K G K S P L E A H P E F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E T T C P K C G G P A K R D T D T M D T F F D S
- - - - - - - - - - - - - - - - - - D T F F D S
------------------------------------------------------CCCGGGCTCCTCGTAGGC
505506507508509510511512513514515516517518519520521522523524525526527528
S W Y Y L R Y T D P H N D R L P F D P E K A N A
S W Y Y L - - - - - - - - - - - - - - - - - - -
CCTTTCCAGGGGCTC---------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
W M P V D Q Y I G G V E H A V L H L L Y S R F F
- - - - - Q Y I G G V E H A V L . L L Y S R F F
---------------CCTCTGGTCGTGGGCAGGGACGGCCATGATGGC---GGTGCCGTAGCCAAAGAGCAC
553554555556557558559560561562563564565566567568569570571572573574575576
T K F L H D L G M V K V E E P F Q G L F T Q G M
T K F L - - - - - - - - - - - F . G L F T Q - -
GTAGTCCGCGGT---------------------------------TAG---GTAGGCCCCCAGGAA------
577578579580581582583584585586587588589590591592593594595596597598599600
V L A W T D F G P V E V E G S V V R L P E P T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I R L E I P E S A L S L E N V R K M G A E L R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
H E D G T L H L W K P A V M S K S K G N G V M V
- - - - - - - - - - - - V M S K S - - - - - - -
------------------------------------GATCCTCACCTCCTT---------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G P F V K E Q G A D I A R I T I L F A A P P E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E M V W T E E G V Q G A W R F L N R I Y R R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E D R E A L L E T S G V F Q A E A L E G K D R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L Y G K L H E T L K K V T E D L E A L R F N T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I A A L M E F L N A L Y E Y R K D R P V T P V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R T A I R Y Y L Q M L F P F A P H L A E E L W H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
W F W P D S L F E A G W P E L D E K A L E K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V E V A V Q V N G R V R G T I H I P K D A P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V A R A E A L K V R N V R A H L E G K E V V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
I Y V P G K I L N L V V R G
- - - - - - - - - - - - - -
------------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_leu_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T A R R D A L V A I E Q E K Q A Y W A A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L H E F D A P A P G E A R P A K Y L T T F P F P
- - - - - - - - - - - - - - - - - L T T F . F P
---------------------------------------------------GCCGGCGAGGCG---GAGGTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y M N G K L H L G H G F S L T K A E F A S R F Q
Y M N G K L H L G H G F S L T K A E F A S R F -
GTGTGTGACGTTCGACAACATCACGGCATCGTCGATGACGGGCTGCGTCGACATGGCCTGCTCCCCGTA---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R M M G R R S L W P F G F H V T G T P I A A C A
- - - - - - - L W P F G F H V T G - - - - - - -
---------------------GGACATGAAGGCCATCAGGGCCTTGCTCAT---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q K I A K E M Q Q Y G N P P Q F P A E L L E D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P K A M V V K E P T E A L G Q H K S K R G K S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P A K P Q W L I M Q S M G I P D S E I A K F A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P Q Y W L D Y F P P I A M E D L K S F G C H I D
- - - - - D Y F P P I A M E D L K S F . . . . D
---------------CGGCTTCGGGAACGGCTGCGTGACGACAGAGCCCTCGTGCTG------------CCA
193194195196197198199200201202203204205206207208209210211212213214215216
W R R S F M T T E R S P Y F D R F V R W Q F N I
- - R S F M T T . . S - - - - - - - - - - - - -
------CTCCATCGTGTGTGGCGC------CAT---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L R R E N L L N Y G K R Y C V Y S P R D G Q P C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A D H D R A S G E G V L P Q E Y A L V K L I V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N P L A Q P C F A E H K D I I G D R N V V L P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A T L R P E T V I G Q T N C W V S N K L N Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y Y V R N A K G E D E V Y I M T A R A A R N I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y Q N F Y V N G Q V G T D P E P L F E V E G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
M V G I P L S A P L A P Y T T I Y T L P M A T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T E A K G T G V V M S V P S D S P D D Y I N F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q L L N K P E Y R V K L G I K D E W V V P F A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I P I I D I P E L G T E G A K F M C E K L K I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G P N A T E L L E E A K K V C Y Q Q G F Y H G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M I S G P Y A G V K V S E A K V K T H R D M E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A D Q C I R Y Y E P V R Q V I S R S G D E C V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A L C D Q W Y L E Y G K D D W K K L V Q D H I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K M D M F F P G V R N G F E E T L N W L A D W P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
C S R T F G L G T Y L P C D A S H T M I I D S L
- - - - - - - - - - - - - - - - - - - - - D S L
---------------------------------------------------------------GCCGTGGTA
601602603604605606607608609610611612613614615616617618619620621622623624
S D S T I Y M A Y Y T I D R F F N V G A D G S T
S D S T I Y M A - - - - - - - - - - - - - - - -
GAAGCCCTGCTGGTAGCACACTTT------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D L C G K A D N P Y G L A P E M F T D E V F E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I Y H G V G D A A T V A G A V R M P V E S L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
M R N E F E Y W Y P V D L R C S G K D L I Q N H
- - - - - - - - - - - - L R C S G K D L I Q N .
------------------------------------GACGCCGGTACCCTTCGCCTCCGTGATGGTGGC---
697698699700701702703704705706707708709710711712713714715716717718719720
L T M F L Y N H A A I W P T D E S K W P R A I F
L T M F L Y N H A A I - - - - - - - - P . A I F
AGGCAGCGTGTAGATTGTCGTGTAAGGCGCCAG------------------------CAT---TGCTCCCTC
721722723724725726727728729730731732733734735736737738739740741742743744
C N G H I Q V D N E K M A K S R G N F I S L R E
C N - - - - - - - - K M A K S - - - - - - - - -
CACCTC------------------------GACCTGGCCGTTTAC---------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A M D M Y G A D A T R L T C A D A G D S M D D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N F V R E T A A G F V L K M T T L L E Q A K E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V E R T D L R S G G Y N E F D K I F N N T M N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I I T R T E G F Y H R M Q F R M V L N T A F H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L S N E Y S Q Y K M Y C D D L N V H A Q L G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Y Y E V V A L M M M P L A P H T M E H L W Q N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L Q H E G S V V T Q P F P K P T A K L D Y S L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V A S R V M T I A L K E I R S Q V I K N A K K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
G P V E E V I V Y T R R E Y T D W Q R Q A L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
L H E L Y E A N G N T F P E D M A K Q V V A R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
T K I M S K A L M A F M S F V K G N V E K Y G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
Q A M S T Q P V I D D A V M L S N V T H N L S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
L A G V S V V R I L S A E D E T Y K E H D A A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
R K C L P G E P S V A L P P V V K R E
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_leu_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S E C G Q S R F A L L G S P S M W R A S A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L A H F S K D V G F A S Y P F T E L E A K W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D F W L R N K T F R T P D I G E L D T S K P K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y I L D M F P Y P S G A G L H V G H P A G Y T A
Y I L D . F P Y P S G A . L H V G H P A G Y T A
TACATTTTAGAC---TTCCCATATCCCAGCGGTGCA---CTTCACGTTGGGCACCCAGCTGGTTACACAGCG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T D I L A R L K R M Q G A N V L H P I G W D A F
T D I L A R L - - - - - - - - L H P I G W D A F
ACAGACATCCTGGCAAGGTTG------------------------CTGCATCCAATCGGATGGGATGCTTTT
121122123124125126127128129130131132133134135136137138139140141142143144
G L P A E Q Y A L Q T G T H P R V T T E R N V N
G - - - - - - - - - - - - - - - - - - E R N V N
GGT------------------------------------------------------GAGCGAAACGTCAAT
145146147148149150151152153154155156157158159160161162163164165166167168
R F R Q Q L Q S L G F S Y D W D R E V S T T D P
R F R Q Q L Q S L . . . . D - - R E V S T T D -
CGCTTCCGGCAACAGCTGCAGTCACTG------------GAC------AGGGAGGTGTCGACGACAGAT---
169170171172173174175176177178179180181182183184185186187188189190191192
E Y Y K W T Q W I F L Q L F N K G L A Y Q A E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P V N W C P A L G T V L A N E E V I D G K S E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G D H P V V R L P M K Q W M L R I T Q Y A Q R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L D D L D E L D W P D S I K D M Q R N W I G R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E G A T I T F G L Q V Y T T R P D T I F G A T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M V L A P E H P L L D S L T T A E Q K I D V N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y V R K A A L K S D L E R T E L Q K V K T G V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T G S H A I N P A T G K A V P I W V A D Y V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S Y G S G A I M A V P A H D T R D Y E F A T Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q L P V V R V V Q G P S G E D N E L P F T G K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T A T S S S C A A A G L S L D G Q G T A E A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S V V R W L E Q Q G K G A A Q I N F K L R D W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F A R Q R Y W G E P F P I V Y A E G S D E P E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I S E E D L P L T L P E T D N F R P S G T P E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P L A N I T E W V H F V D P K T G K R Y R R E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S T M P Q W A G S C W Y Y L R Y L Q P W N T D R
- - - P Q W A G S C W Y Y L - - - - - - - - - -
---------CCGCAGTGGGCTGGATCTTGCTGGTACTACCTG------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A I D P E V E K Y W L P V D L Y V G G A E H A V
- - - - - - - - - - - - - - L Y V G G A E H A V
------------------------------------------CTGTATGTCGGTGGTGCGGAGCATGCTGTG
577578579580581582583584585586587588589590591592593594595596597598599600
L H L L Y A R F W H K V L F D L G V V S T K E P
L . L L Y A R F W H K V L - - - - - - - - - - -
CTG---CTGTTGTATGCCAGGTTTTGGCACAAGGTGCTG---------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
F R R L V S Q G M I L G E V E Y T A Y K D A Q G
F R . L V S Q - - - - - - - - - - - - - - - - -
TTCCGG---CTAGTGAGCCAG---------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Q Y V D E N H P E A T A V R V E E G Q V D K K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N G F V L R S D P S V R V S T R A H K M S K S R
- - - - - - - - - - - - - - - - - - K M S K S -
------------------------------------------------------AAGATGAGCAAGAGC---
673674675676677678679680681682683684685686687688689690691692693694695696
G N V V N P D D V V T M Y G A D S L R L Y E M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
M G P I R E T K V W S T K S V E G V H R F L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S Y R L V T G S N V A D V E P T K D Q L R L L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A T I K R V T E E T E E L R F N T G I S A L M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F V N S A F K W E E V P R S V L E P F V L L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P Y A P H I A E E L W Q V L G H S D T L T Y E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
W P T Y N E E L L V S D T F N L P V Q V N G K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R G T V E V S K Q I S Q A D A E V A G R S I T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V S K F L E G K P L K K V I F V P G R I V N F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891
V G K
- - -
---------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_leu_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K C L S R L Q A I E K K W Q R Y W S S R N T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M A E P P V G S D R D K R D S K K F F V T F P Y
- - - - - - - - - - - - - - - - - - F V T F . Y
------------------------------------------------------GTATGCAGAAAG---TTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y M N G R L H L G H L F S A T R A E F A V G Y
P Y M N G R L H L G H L F S A T R A E F A V G Y
ATGTTCCGAGAACGGCAGCTTTGTTACTAGCGCGTCCGGGCCGTCTGTCTTGGATGCAGATATGAGTTGTGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L M R G D S S L F P F G F H V T G M P I C G A
- - - - - - - - L F P F G F H V T G - - - - - -
------------------------ATCTTTCTTTGGTGTTTCTAGGACGTCTAT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A K K L A D E I E H Y G C P P V L P T A D S L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L P G S V T A S E N A I D K V G Q F K A K K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L N A K T V S K S Q W D I L I D L G V P E K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P K F V D P Y H W V K H F P A L C Y K D M C K F
- - - - - - - - - - K H F P A L C Y K D M C K F
------------------------------CACACGCAGCTGCTTCAGTGCCTCTGCTAGTGTATCCTGAGA
193194195196197198199200201202203204205206207208209210211212213214215216
G A R V D W R R S M I T T D A N P Y Y D L F V K
. . . . D - - R S M I T T D - - - - - - - - - -
------------ACG------GGAGTTCGACCTACCAAGTAC------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
W Q F R K L Y R D G Y I K F G K R N C I W S P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D G Q A C M D H D R F S G E G V Q P Q E Y I G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K L E L I N Y T T L L E E Q R E Q Q Q E G E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G D G M D D S L A E K L N I K L P R F Y S N P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N K A I F D Q L W E N Q V D N A K V Y L L A A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L R P E T M V G Q T N C W V L P T G R Y G A Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I N K D E V I I V S E H A A V N M A H Q G L N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N K P F G E L D F I C E I S G S D L L L A T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A P L S P Y E Q I F V L P L E T I K M D K G T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I V T S V P S D A P D D Y A C Y K D I L E N R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G I A E K Y G V D V G L M L E P Y S P L P I I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I P D I G T L S A V R L C E E S N V S S L H D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A K L T Q I K E I C Y T K G F Y T G I M K M G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F A G Q C V K D C K Q S C R D L L V Q N N Q C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V Y S E P E S E V I S R S N C V C V V A A A D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
W Y L D Y G N V A W K D K V R Y N I E K Y L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Y H D E V K N Q F N R T V D G F R E W A A S R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F G L G T K L P F D E R Y V I E S L S D S T I Y
- - - - - - - - - - - - - - - E S L S D S T I Y
---------------------------------------------CTTTACACACTGGCCGGCAAATGGGCC
649650651652653654655656657658659660661662663664665666667668669670671672
N A Y Y T V A H Y L Q G G S L D G S T S L F P V
N A - - - - - - - - - - - - - - - - - - - - - -
CATCTT------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E I V D D S F F D Y V F D L S N N L P E K F M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y F S T D P A G A D R L H Q L K K S L L V P G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N S Q I I L A I R S A E D L L T A M R E S F C F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
W Y P V D L R C S G K D L I P N H L T M M L Y N
- - - - - L R C S G K D L I P N . L T M M L Y N
---------------AATTGTCTCCAGAGGCAAAACAAAGATTTGCTC---AGGACTGAGAGGGGCTCGGAC
769770771772773774775776777778779780781782783784785786787788789790791792
H T A I W S D D E A K W P R G M R A N G H L Q L
H T A I - - - - - - - - P . G M R A N - - - - -
GGTAGCCAAGAG------------------------TAT---ATCCAATTCTCCAAA---------------
793794795796797798799800801802803804805806807808809810811812813814815816
N D A K M S K A T G N F L T A D E A I R K Y G A
- - - K M S K A - - - - - - - - - - - - - - - -
---------GTGGGCCATGTTCAC------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
D A V R F A L A D A G D G L D D A N F R E E T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
N N A V L R L Y N L L A T C Q E L L A A S A V C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Y P E S Y E D I Y S T I E A S S A D C I H E C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
F L A S I L D C T L R A C S A F E R C S F R E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
L I I S F N E L G H S R D Q Y I H S C E T R R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
P Y C R F L I E E Y V S T Q A K L L A V I C P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
I A E E L N A E V L G R S N S I F R D P L Q S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
D T L A E A L K Q L R V F L K I D E Y V Q A T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
V R L K N Y L V D V L K P R K D G T V K L P N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
A K I A Q V Y V A Q D C P E W Q T R V A E F L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
S M Y Y D E T E E Y G G L G A L P K D A S S R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
S K Y C I D V L E T P K K D L Q K V M K Y A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
L I S A S K T D G P D A L V T K L P F S E H K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610971098109911001101110211031104110511061107110811091110111111121113111
L S A Y S D A V R T G L G V E Q I S F Y M V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
411151116111711181119112011211122112311241125112611271128112911301131113
G P V P P E S C K A A T P G K P I V F F E
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_leu_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E S S A P Q S I H Y Q P A A I E K R W Q N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W R N D R I Y Q T P Q N S D G E A F Y A L S M F
- - - - - - - - - - - - - - - - - - Y A L S . F
------------------------------------------------------TACGCTCTTTCG---TTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y P S G K L H M G H V R N Y V I T D V I A R A
P Y P S G K L H M G H V R N Y V I T D V I A R A
CCCTATCCTTCAGGGAAACTTCATATGGGGCATGTGCGTAACTATGTAATCACTGATGTAATTGCAAGAGCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q R M R G K R V L H P M G W D A F G L P A E N A
- - - - - - - - L H P M G W D A F G - - - - - -
------------------------TTGCACCCTATGGGATGGGATGCATTTGGT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I E R G I D P S K W T N T N I Q Q M R K Q L D
- - - - - - - - - - - - N T N I Q Q M R K Q L D
------------------------------------AATACTAATATTCAGCAGATGCGAAAACAACTCGAT
121122123124125126127128129130131132133134135136137138139140141142143144
Q L G L S I D W E R E I S T C N E D Y Y R W T Q
Q L . . . . D - - R E I S T C N - - - - - - - -
CAACTA------------GAT------CGAGAAATCTCTACCTGCAAT------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W L F L Q F Y D A G L A Y Q Q E A T V N W D P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D Q T V L A N E Q V N G D G C S W R S G A K V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K R K L R Q W F L R I T N Y A E I L L R D L D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L T G W P E R V R T M Q A N W I G R S K G C E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S F L I Y N E E D R L T D Q F I T V F T T R P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T I C G I S Y I A V S V D H D I V S Q S L M T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D R S R I Q R F C K E I S F Q K D N N H I S S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q I K Q G I P L G K Y A C H P L N G R R I P I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I A D Y V L A D H G T G A V M G V P A H D Q R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I F A H S Y G L I I K P V I I S E N T N H N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L S F S N I Q S A F I D L G K L I K S G I F D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L S S E E A G E A I L S Q A Q L A R W G Q S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T Y K L H D W L I S R Q R Y W G C P I P I I H C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q S C G T V P V P T T D L P V E L P K N L N L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G K G G S P L S L V S K W V K T S C P K C G Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A Q R E T D T M D T F M C S S W Y F L R Y S D P
- - - - - - - - D T F M C S S W Y F L - - - - -
------------------------GACACATTTATGTGTTCTTCTTGGTATTTCTTG---------------
529530531532533534535536537538539540541542543544545546547548549550551552
S N K K E P F S S E K I Q D W L P V N H Y V G G
- - - - - - - - - - - - - - - - - - - H Y V G G
---------------------------------------------------------CACTATGTAGGTGGT
553554555556557558559560561562563564565566567568569570571572573574575576
I E H A I L H L L Y S R F F T K V L N D R G L L
I E H A I L . L L Y S R F F T K V L - - - - - -
ATAGAACACGCAATTCTC---TTACTTTACTCTCGTTTTTTTACCAAGGTATTG------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N F S E P F I R L L P Q G M V Q G I T Y K V P S
- - - - - F . R L L P Q - - - - - - - - - - - -
---------------TTT---CGCCTTTTGCCTCAA------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T G E Y I P V D N I T D L D N P I D P N S G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L E V I F E K M S K S K G N G V D P T R V I E H
- - - - - - K M S K S - - - - - - - - - - - - -
------------------AAAATGTCCAAATCA---------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F G A D T A R M F I L F K A P P E K D L E W N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S D V E G Q F R F L Q R I S R L V E M V L K K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I R L N L K E D L S T T I N S K K L N K D E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V H R A T H Y A I A A I T E D L D G E V Q L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A I A E L M K L N N I L S S V S D S I S E P I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L E G L K T L I I L L A P F A P H L S E E L W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R L V N D S N S I H N Q R W P I L D P S A L I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E N I K L V I Q V N G R V R G F I D V P A N A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K E K L E K L A L N S E S A Q K W I S G K L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
R V I T V P G K L V N I V L
- - - - - - - - - - - - - -
------------------------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_leu_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_leu_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N C N E H E S T K L N Y L N S L E K S R D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T D I S D K P K Y F I T F P Y P Y M N G K L H L
- - - - - - - - - F I T F . Y P Y M N G K L H L
---------------------------TTTATTACTTTT---TATCCATATATGAATGGAAAACTACATCTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H L Y S I S K A D F M S Y Y K E L Q G F N V L
G H L Y S I S K A D F M S Y Y - - - - - - - - L
GGTCATTTATATTCGATATCAAAAGCAGATTTTATGTCATATTAT------------------------TTA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F P L A F H C T G M P I A A L A K K L G E E L E
F P L A F H C T G - - - - - - - - - - - - - - -
TTTCCTTTGGCTTTTCATTGCACAGGT---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G K K T D I S T K E I I Q N L G F N D V M P F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D P V H W I K T F P K L C I S S L K T F G A N I
- - - - - - K T F P K L C I S S L K T F . . . .
------------------AAAACATTTCCTAAGCTGTGCATTAGTTCATTGAAAACTTTT------------
145146147148149150151152153154155156157158159160161162163164165166167168
D W R R S F V T T D I N K Y Y D S F V R W Q F F
D - - R S F V T T D - - - - - - - - - - - - - -
GAC------AGATCTTTCGTTACGACAGAT------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N L K E L G Y L S F G K R H S I Y C P L D K Q M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C L D H D R R K G E N I K P V R Q I M F K F H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H D K I L L V R Q N S I G K P Y K L V C G K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E V V S F K Y N N T S F L A E K I I F D N L K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q I N N V K Y K E S L V L S M D L K D G L T Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G T N I E V E V I E K N I L V V K T D T K S D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E L Y E K E I K A L N E I E E T L F T L S T S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E G I V E S V A K L S V E N T K D L L V Q T K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I S V Y I P E K E V I S R S G G I C V V S L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Q W Y I D Y S N E K W K S K V K K C L D N L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C G P D T R S M L Y A G I D W V N K W G F S R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F G L G T K I P W D T Q Y L I D S L S D S T I Y
- - - - - - - - - - - - - - - D S L S D S T I Y
---------------------------------------------GATAGTTTAAGTGATAGTACAATTTAC
457458459460461462463464465466467468469470471472473474475476477478479480
M A F Y T V K H L L F E D L E G K L E I F P S N
M A - - - - - - - - - - - - - - - - - - - - - -
ATGGCA------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K L S N D V W D Y I F A G K D L V P E L Y G Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D L L E K C R N N F Q Y F Y P V D L R V S G K D
- - - - - - - - - - - - - - - - - L R V S G K D
---------------------------------------------------TTAAGAGTCAGCGGTAAAGAT
529530531532533534535536537538539540541542543544545546547548549550551552
L I K N H L L F F M F N H V A L F D E K Y W P K
L I K N . L L F F M F N H V A L - - - - - - P .
CTTATAAAAAAT---TTACTGTTTTTTATGTTTAACCATGTAGCGCTA------------------CCA---
553554555556557558559560561562563564565566567568569570571572573574575576
R I F T N G H L M L N K E K M S K S T G N F L S
R I F T N - - - - - - - - K M S K S - - - - - -
CGTATTTTTACTAAT------------------------AAAATGTCTAAAAGT------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V D D A L L K Y G K S A T R M C L A V C G D T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D D A N F V E D N A N L F I L K I Y T F V K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Q K L N E L V R K K S E N E T I A S Y S N A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L L L E T V S V N V T E A L N A Y N S M K Y S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V V K F S F F E M V N L I N L Y N N I N G T N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L L K N L V Y K S A T Q L L Y P I M P D L C R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L I E K Y F D S E F N L P E P K L K T N K M I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A F E Y I S E L I K K I A A S K Q A K N N S C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K I A V G K N Y P E W K K E I F E L I D K I D C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P R N N E I K K N K V F I A S L L D S V K P I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
Q K S K I N I T K G N N F V M D Y L V N P D K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V M K F N E Y E I I N E F K F Y I E N M S N K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884
A I L E E H C D A E P L N P I I T F S K
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_metALPHA_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_metALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K Y V I G S A W P Y V Q T V P H L G N M I G
- - - - V I G S . W P Y V Q T V P H L G N M I .
------------CTGTTCCCACGG---TTTCCTAGAGTATTTCTGGTTTCTAAGCTCCTCTAATTTGGC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V L S A D V Y A R Y L R L K G H E V V F V S G
S V L S A D V Y A R Y - - - - - - - - V F V S G
TAAGGCCTTTACTTCTTCCTCTGTTATTTTCCT------------------------CGCTTTCCCCACGGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D V H G T P V E V E A I Q L G V D P A E Y S M
S D V H G - - - - - - - - - - - - - - - - - - M
GGGCGGCCTCTTCGC------------------------------------------------------GCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K M H A I V A E L F K K W N I S F D L Y T H T H
K M H A I V A E L F K K W . . . . D L Y T H T H
CTCGGGGATGGCCGGCGCAAGGCCTACTGCGAGGAATTT------------GGCGTGGTACATTACGGCGTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E T H I K F V Q D F Y L K I Y E N G Y I F T K
S - - - - - - - - - - - - - - - - - - - - - - -
TGC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E D E V P Y C P R D K I Y L P D R F I I G K C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G Y E R A R G D Q C E N C G R L L D P K Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I E P K C A V C G S K P E W R I T K H W Y L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R R L E D R I R K Y V E E N P H L P P N A K E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S L A M L K E G L R P R A V T R D N K W G I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P F P G A E G K T I Y V W F E A V L G Y I S A V
- - - - - - - - - - Y V W F E A V L G Y I - - -
------------------------------CGTAGTGGTGGGCATCACGTAGCCGCCGCCATT---------
265266267268269270271272273274275276277278279280281282283284285286287288
V E Y F K K I G R E E E W K R F W L D P E T K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V F F V G K D N V P F H V I I L P A L L L A N G
V F F V G K D N V P F . V I I L P A L L L A . .
GTCCAGCCAGAACCTCTTCCACTCCTCCTCCCT---TATTTTTTTGAAATACTCAACTACGGCCGA------
313314315316317318319320321322323324325326327328329330331332333334335336
G G Y V M P T T T A S T E Y L L Y E G D K F S K
. . Y - - P T T . A S T - - - - - - - - K F S K
------AAC------AAACCACAC---TATAGTCTT------------------------CGGTATGCCCCA
337338339340341342343344345346347348349350351352353354355356357358359360
S R R W G V W I D E A L Q L L P A D Y W R F V L
S - - - - - - - - - - - - - - - - - - - - - - -
CTT---------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I Y I R P E N R D T N F S W S T A L E I I N K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N D D V G N Y A N R V L S F I K N R M G G A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P P R G K P S R D D E E F I E K V K R L F E K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E A H Y E A I E L K D A V H T V V E I A R E G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K Y L N A R A P W D L V K K D V D A A N A V M Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
H A Y W S L K F L A V G L A P A I P E S A E Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
W K M M G L D A P L T W E E A K R P P A V G K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L G E V R P L F R K I T E E E V K A L L A K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570
E L R N Q K Y S R K Y P W E Q V V I
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_met_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I G I K I L V N C A L P Y A N G P L H V G H I
- - - - - - L V N C . L P Y A N G P L H V G H I
------------------CTTGTAAACTGT---CTGCCTTATGCAAACGGGCCGTTACATGTTGGGCATATT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G A Y L G A D V F V R F N R L I G N E V L Y V
A . A Y L G A D V F V R F - - - - - - - - L Y V
GCA---GCATACCTCGGTGCAGACGTATTTGTAAGGTTT------------------------CTATATGTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G S D E Y G T P I T V R A E K E G K S P Q E I
S G S D E Y G - - - - - - - - - - - - - - - - -
TCCGGAAGTGATGAATATGGA---------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A D R Y Y A E H I E T F K K L G I N F D I F M R
- D R Y Y A E H I E T F K K L . . . . D I F M R
---GATAGATACTATGCAGAACACATAGAAACATTCAAAAAACTT------------GATATTTTTATGAGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T T Y P E H S S V A Q E F F L K L L N E G V I E
T T Y - - - - - - - - - - - - - - - - - - - - -
ACAACGTAT---------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K G T M I A P Y C R K I G R F M P D R Y I E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C P Y C G Y K K A R G D Q C D N C G R T L D P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E L I N P V C I L S G E T P E F R E T E H F F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R L D L F E E R L E E W L K T K T F W K P N V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A Y T R N F I Q G G L K K R A I T R D I D W G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K V P L E G Y E H K R I Y V W F E A L I G Y I T
- - - - - - - - - - - - Y V W F E A L I G Y I -
------------------------------------TATGTGTGGTTTGAGGCTTTGATTGGATATATC---
265266267268269270271272273274275276277278279280281282283284285286287288
G A K M F S E V I G K P N Y W K E F Y F D K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K N Y Y F I G K D N I P F H S I I W P A M L L G
- - Y Y F I G K D N I P F . S I I W P A M L L G
------TATTACTTTATAGGAAAGGACAATATACCTTTT---AGCATAATATGGCCGGCTATGCTGTTGGGC
313314315316317318319320321322323324325326327328329330331332333334335336
Y G E L N L P Y D I P A N E Y L T F K G E Q F S
Y - - - - - P . D I P A N - - - - - - - - Q F S
TAC---------------CCA---GATATTCCTGCAAAC------------------------CAGTTTTCG
337338339340341342343344345346347348349350351352353354355356357358359360
K S R G I G Y T V D E L L R V I P P D Y L R Y Y
K S - - - - - - - - - - - - - - - - - - - - - -
AAGAGC------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V A S I L P E T G D S D F S L E E L V K T V N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L I D K Y G N F V H R T L S F I N K Y D L K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T K P N S L N D E A F E Y A Q N A F K E Y C D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S Q V H I K R S L A I W L N L A I Y A N S Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N K S E P W N L I K T D R D Q C N Y K L Y V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K L A Q Y L T A M I Y P F T P T S A K A I W E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L G V N M D I D S S F S I L N S I N D F S V K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543
S R I P F E K L D I D K L K L
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_met_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K V L V T S A W P Y V N A V P H L G N L I G S
- - - L V T S . W P Y V N A V P H L G N L I . S
---------TTAGTAACATCT---TGGCCTTATGTTAATGCTGTTCCACATCTAGGAAATTTAATA---TCT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I L S A D V F A R Y A R L K Y G K E N V V F V S
I L S A D V F A R Y - - - - - - - - - - V F V S
ATATTATCAGCAGATGTATTTGCAAGATAT------------------------------GTTTTTGTAAGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G S D E H G T P I E I E A R K R N I E P R K L T
G S D E H G - - - - - - - - - - - - - - - - - -
GGTAGTGATGAACATGGT------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D Q A H A Y D K K L F I D T W K I S F D N Y S R
D Q A H A Y D K K L F . D T W . . . . D N Y S R
GATCAAGCACATGCCTATGATAAGAAATTATTT---GACACATGG------------GATAATTATAGCAGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T E S E V H K E F V R N F L I K L E K Y I K V E
T E S - - - - - - - - - - - - - - - - - - - - -
ACTGAGTCT---------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E D E I P Y C E K D K L F L P D R F V K G V C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G F E D A R G D Q C D N C G R L L T P R S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I N A K C A L C G N P P V F K V T K H W F F D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S E F G D K I R D W I S S S S T M P D N V K S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A L S W V K E G L R P R S I T R D N M W G I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P F K G A E N K T I Y V W F E A L L G Y L S A T
- - - - - - - - - - Y V W F E A L L G Y L - - -
------------------------------TATGTCTGGTTTGAAGCTCTTCTAGGTTATCTA---------
265266267268269270271272273274275276277278279280281282283284285286287288
V E Y F K N L G K E E M W K E F W L Y N D T K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y Y F I G K D N I P F H A V I L P A M L M A S N
Y Y F I G K D N I P F . A V I L P A M L M A S -
TATTATTTCATAGGAAAGGATAACATTCCTTTC---GCTGTTATATTACCTGCAATGTTAATGGCAAGT---
313314315316317318319320321322323324325326327328329330331332333334335336
E K Y N L P S V I A A T E Y L L Y E G Q K F S K
- - - - - P . V I A A T - - - - - - - - K F S K
---------------CCT---GTTATAGCTGCTACT------------------------AAGTTTAGCAAG
337338339340341342343344345346347348349350351352353354355356357358359360
S R K I G V W I D E A D K L M D V E Y W R F I L
S - - - - - - - - - - - - - - - - - - - - - - -
AGT---------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I R L R P E E K D T N F T W R E A L R I V N T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N D D I G N Y A N R V L S M V K R Y C D G V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P S P K E A I L N D E D K N L I T L I T E S P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R M G E L F E L G K I K A G S E E I L K L A R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G N L Y L N N R A P W S L V K T N R D E A N N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L Y I S V N S L R T L A I M L Y P I M P T Y S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N L Y Q Q L G L S D L E S E T W D S A G S L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
M P G H K I G E I R S L F K K I D M S P E E L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571
K K L D E I R R E V E K E R P D L L R
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_met_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V Q I K I L V N C A L P Y A N G P L H I G H I
- - - - - - L V N C . L P Y A N G P L H I G H I
------------------TACCAGGGATTC---GTCGATCTTCTCGAATGGAATCGCCCCCCTGTGAACCGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G A Y L G A D V F V R Y N R L M G N Q V L Y V
A . A Y L G A D V F V R Y - - - - - - - - L Y V
AAA---GTGCATCTCATAGAGATGCCGGTACGATTGCCC------------------------GTTCCATAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G S D E Y G T P I T V R A E K E G R S P K E I
S G S D E Y G - - - - - - - - - - - - - - - - -
CTTTTCCGCGGAGGATGGTAT---------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A D I Y Y E E H L R T F E N L G I S F D I F M R
- D I Y Y E E H L R T F E N L . . . . D I F M R
---ATCATGGTTCAGCTTTTGCCTGTCGTTCTTGATCGTCTTCCA------------GTTGAAGAAGCCATT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T T W P E H S E N A Q D F F I K L L N E G Y I E
T T W - - - - - - - - - - - - - - - - - - - - -
TGCATATAT---------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K G T M I A P F C R K I G R F M P D R Y I E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C P Y C H Y P K A R G D Q C D N C G R T L D P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L I D P K C I L S G E T P E F R E T E H F F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R L D L L E D R L K S W I S S K N F W K P N V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A Y T Q N F I S G G L K K R P I T R D I D W G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I P L D G Y D S K R I Y V W F E A L I G Y I T
- - - - - - - - - - - - Y V W F E A L I G Y I -
------------------------------------CTTGCCTATGAAGTAGTAATTCCTGACCTCGGG---
265266267268269270271272273274275276277278279280281282283284285286287288
G A K E Y S K R T G N P D L W K E Y Y M D P E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R N Y Y F I G K D N I P F H A I I W P A M L M G
- - Y Y F I G K D N I P F . A I I W P A M L M G
------CGCTTCGAACCACACATATATTCTCTTTGAATC---TCCGTCCAGAGGTATCTTGACACCCCAGTC
313314315316317318319320321322323324325326327328329330331332333334335336
Y G G F N L P Y D I P A N E Y L T F K G Q Q F S
Y - - - - - P . D I P A N - - - - - - - - Q F S
GAT---------------ACG---CTTCAGTCCGCCAGA------------------------GACGTTTGG
337338339340341342343344345346347348349350351352353354355356357358359360
K S R G I G Y S V D D L L K A V P A D Y L R Y Y
K S - - - - - - - - - - - - - - - - - - - - - -
CTTCCA------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V A S I L P E T G D S D F S L E E L V N T V N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L I D K Y G N L V Y R I L S F M D R Y S I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D P V D V S G D E E F K Y A Q R S F E L W S E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S G V H V K R G L L R W L D L A I Y A N G F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N R S E P W K T I K N D R Q K L N H D L Y L S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K I T E V L T V M V Y P Y I P S S A E K I W N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L G I P F A I G Q S Y R H L Y E M H A F S V H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547
G A I P F E K I D L E S L V S K L N N
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_met_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Y E D Y P T D D P A V V T A G L P Y A N G D
- - - - - - - - - - - - V V T A . L P Y A N G D
------------------------------------GGTCGTGAGGAG---CGCGGCCTCGCCGGCGGCGAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L H I G H L R S Y V S A D A F T R A L Q K L G Q
L H I G H L R S Y V S A D A F T R A - - - - - -
CACCATCCCGTTGGACTCAACGCCGAACAGCTCCGCTTTCTCGAGGTTCGCGAC------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q A V Y V C G S D M H G T P I A V N A A E E G V
- - V Y V C G S D M H G - - - - - - - - - - - -
------GGCGTCGAGGTCGTGGAGCTGTTTGATACC------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D P E E F A L R H H K Q Y R E T F P K F N V D F
- - - - - - L R H H K Q Y R E T F P K F . . D -
------------------GTCCGCGCCCTCGATTCCCTCAGCGGTCTGGATTTCGCCGAC------GTC---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D Q Y G H T H D E T N T E L T K E F V R A W E D
- Q Y G H T H D - - - - - - - - - - - - - - - -
---CTGGAACTCCTCGAAGCCGAT------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N G Y V H E K E I D V A Y D P E A D Q W L P D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F V E G T C P Y C G E H A R G D E C D E G C Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H L E P G E I E D P V S T I T G N P A E Y R R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E H K F L R L S A L Q E H L Q G F I N R V E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S N A Q N Q P R E W I E G E L Q D L C I T R D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D W G I D Y P G E G A E D L V L Y V W V D A P I
- - - - - - - - - - - - - - - - Y V W V D A P I
------------------------------------------------CATCGCCTGCGCGATCTCGGTCTC
265266267268269270271272273274275276277278279280281282283284285286287288
E Y V S A T K Q Y S E R A G D L D W E S V W K D
E Y V - - - - - - - - - - - - - - - - - - - - -
CACCTCGTC---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G D G E I V H V I G R D I I Q H H T V Y W P A M
- - - - - V H V I G R D I I Q H . T V Y W P A M
---------------GTCCGCGAGTTCGCTGTTCACGCGCTCCGCGAA---GTCCCACGAGAAGTTCACGTC
313314315316317318319320321322323324325326327328329330331332333334335336
L E A A D Y A E P R A V C A A G F V N I D G K G
L E A . . Y - - P . A V C A A - - - - - - - - G
GCGCTCGAA------GGC------CAT---GTACCGCAGGAGGTC------------------------CTC
337338339340341342343344345346347348349350351352353354355356357358359360
L S T S K N R A I W A E E Y L D E G F D P D L L
L S T S - - - - - - - - - - - - - - - - - - - -
CTCGGCCCAGAT------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R Y Y M T T A S G F E R D V N F S W D R F A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V N S E L A D V V G N F V Y R A L L F A N R N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G G T P E A G L S D E V E T E I A Q A M D D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D A L N D Y D L R T A G E R T V A L A R F G N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Y I Q R N E P W K L D D E E A T P V I R D C V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L V K A V A V L L Q P F T P E K A E E V W Q Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E E A D T V A D A T I A D C L Q E P P A E F G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P E E L F T K V E D D R V A E L D E T L Q E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E A A S A D D S E E T E G G E E S D V E L E P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A D D R I G F E E F Q S L D L R V G E I Q T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G I E G A D D L A R L E V D I G H E V R Q I V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G I K Q L H D L D A L P G T K V V V V A N L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A E L F G V E S N G M V L A A G E A A D L L T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683
H G D S V P G T K V K
- - - - - - - - - - -
---------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_met_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D S S S K P V L V T C G L P Y A N G K A H I
- - - - - - - - - L V T C . L P Y A N G K A H I
---------------------------TTCTTTGTCCGG---AAGAGCTGCTACAATCGCCCCGCCGTCATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G H L R T Y V P A D I F A R S L R K E G R E V T
G H L R T Y V P A D I F A R S - - - - - - - - T
GGCTGCGAGCATCATGCCGTTTGACTCAACCCCGCAAAGTTTGGC------------------------TAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F V C G S D T H G T P I V V N A E E L G I T P K
F V C G S D T H G - - - - - - - - - - - - - - -
ATATTTGCCTACGAGCTCTTCGGAAGT---------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L V E I Y H K H F D E T F K Q L G V Y F D A F
- - - E I Y H K H F D E T F K Q L . . . . D A F
---------CACTTCAACCCTCAGGAGTTTTCTGGACTTCTTTACAGGTTC------------CTTCCCTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G T T D D P E N H N R T L D I V N R L I E K D Y
G T T D D - - - - - - - - - - - - - - - - - - -
CCTGATGTCAAGCTT---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V Y P K I I E I A Y C P A C N R F L P D R Y V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G A C P H C G E T A R G D E C D Q G C G K H L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P G E L Q N P V C T I C G G P A E Y R H Q E H F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F F K L S E F G D Y L M D Y L S N D L G G T T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A R N Y A L G W V K Q G L T D W C I T R N L E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G V R F P G H E D L V V Y V W V D A P I G Y I A
- - - - - - - - - - - - Y V W V D A P I G Y I -
------------------------------------CTCGTGGGACTGGAAGTATGTGTTCCCGAAAGA---
265266267268269270271272273274275276277278279280281282283284285286287288
F T E E W A A Q A G D S W E K F W K G E G E I V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GGC
289290291292293294295296297298299300301302303304305306307308309310311312
H F I G G D I T Y H H C I F W P A M L N G A D Y
H F I G G D I T Y H . C I F W P A M L N G . . Y
TTCTTCGATTTCTGCGCTTACTTCAGGTTC---TTTTCCTTCGGGGACTTCTCCATAGTTCTT------AAA
313314315316317318319320321322323324325326327328329330331332333334335336
S V P T A V V A S G M V K I E D K K F S K T R G
- - P . A V V A S - - - - - - - - K F S K T - -
------GGT---GTACAGGAAGTTGCC------------------------GATCTTTTCCTGGAG------
337338339340341342343344345346347348349350351352353354355356357358359360
Y V V W V G E D Y L D H G F H P D L L R Y Y L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S Y T S H T K E L N F S W R V L Q E K I N A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V A V L G N F L Y R T M L F A F K N Y G E V P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G K L E P E V S A E I E E A L K E V K E A M A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y E F K K A V D S A M A L A S F G N T Y F Q S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E P W K L I K E D R S A C G Q V I Y N C L H L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K A L S L I F E P V L P Q T M E T A W K G L G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E S D I H A S R Y E E A L V P L K A G T K L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P E L L F T K L E D D R I G E M E E I A N Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K A A N A K K S A A K G G E K E P S K S E G M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
P S E E A K V A E K A A K A E E K V P I E T L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q I E Y E D F A K L D I R V G K V L F V E P V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K S R K L L R V E V D I G E E K P R Q L V A G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A S Y Y T S E E L V G K Y V V V L A N L K P A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L C G V E S N G M M L A A D D G G A I V A A L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708
P D K E I K P G S R I R
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_met_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N N K Y L L T T A L A Y T N G P L H L G H A R
- - - - - L L T T . L A Y T N G P L H L G H A R
---------------TCCTACTGGAAG---TTTTTCAGGCGATAATAAAGCCACTTCCTCATCACCAGCAGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S T Y I P A D I I K R Y L K L K G N D V I H V G
. T Y I P A D I I K R Y - - - - - - - - I H V G
---TACCATTCCTTGGGATTCAACGCCACATAATTT------------------------TACAATTTTTTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T D N H G V P I T L T A E K E G V K P E D I V
G T D N H G - - - - - - - - - - - - - - - - - -
ACCAATTAATTCTTCTGG------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N K Y H N E I K R D L D N L S V E F D S Y G K T
N K Y H N E I K R D L D N L . . . . D S Y G K T
TACAATTAATTTTAAAAGTTTTTTGGACTTAGGAACTTCCTC------------TTGAGCAACTTTTAATTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H S D T H I Q N A Q E F Y K K L K E N G Y I Y E
H S - - - - - - - - - - - - - - - - - - - - - -
AATTTT------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E I E Q F Y C P D C D K F L A D R Y V E G S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P F C E G E A R G D H C E V C G R H L E P T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V N P Y C V I C N A T P Q L K K T T H Y F F K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S A L S D N L D N Y V K N S N M P D H I K N M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y S W I R E L H D W D I S R G I K W G V P I P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E N Q V M Y V W L E A P I G Y I S F T K M M G
- - - - - - Y V W L E A P I G Y I - - - - - - -
------------------TTCCGAGCATTTATCAAGTAAAGCCAAATCTTC---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D I W K E Y W L K N N D N N T E N Q N T K I W H
- - - - - - - - - - - - - - - - - - - - - - W H
------------------------------------------------------------------TGCAAT
289290291292293294295296297298299300301302303304305306307308309310311312
F I G K D I T V H H A V F W P G M L L G H G E Y
F I G K D I T V H . A V F W P G M L L G . . . Y
GATTGCAATGAGCTCCGTATTTATCCT---TTGGAATTCATCAAATGAAAAATCACAATC---------TGG
313314315316317318319320321322323324325326327328329330331332333334335336
N L P N S I F S G G Y L T L E G K K M S T S K K
- - P . S I F S G - - - - - - - - K M S T S - -
------TGC---TAAAAAGTATCTCAA------------------------AAAATCATCGACCCA------
337338339340341342343344345346347348349350351352353354355356357358359360
W V V W V D D F I K Y F D S D Y L R Y F L M A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A P L N R D C D F S F D E F Q K R I N T E L I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I I A N F T H R A L V F S H R K F G A L P V I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K P E E E L N K E D L A L L D K C S E T I E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N K N M M D C N L K D A L V D I I H L A K E G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N Y F Q K M E P W T V D D E N R L K Q I M F V C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G V I T K H I A Y L L Y P F M P N K T N E L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L M N E E M D L E I R G N E L K K P I V V F S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I E N D T I K M V K E K L L K S E N S K N T K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K K K N T K K N K N G E K M E L I G I D D F A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I E L K V A Q I L E A E E V P K S K K L L K L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V D I G D E K R Q V V A G I K G H Y T P E E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G K K I V L V C N L K P A K L C G V E S Q G M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L A A G D E E V A L L S P E K D L P V G S T I C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_met_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N S R P L L V T C G L P Y T N G P C H L G H L
- - - - - - L V T C . L P Y T N G P C H L G H L
------------------CTTGTTACCTGT---CTTCCCTATACCAACGGCCCCTGCCATCTCGGCCATCTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R T Y V P A D F Y V R F M R R K G E E V V F I C
R T Y V P A D F Y V R F - - - - - - - - V F I C
CGGACATATGTACCTGCGGATTTTTACGTGCGGTTC------------------------GTCTTTATCTGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G S D N H G T P I V V S A E K E G T T P R Q I S
G S D N H G - - - - - - - - - - - - - - - - - -
GGCTCGGATAATCATGGA------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E R Y H T H F S D T F T K M Q V H F D H F G M T
E R Y H T H F S D T F T K M . . . . D H F G M T
GAACGGTATCATACCCATTTCTCTGACACCTTCACCAAGATG------------GATCACTTCGGGATGACC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D D P T T H A R T K H L V S R L I D R G Y V Y P
D D - - - - - - - - - - - - - - - - - - - - - -
GATGAT------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K V I Q Q A Y C I H C Q K F L P D R Y L E G I C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P H C K K P A R G D E C D Q G C G K H L E P G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I L E P T C K I C G N R A E Y R E Q E H F F F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L S G F Q D W L R E Y L G E L K G T D N A I N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A L G W V N E D L H D W C I T R T L E W G V K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P G H D D L V V Y V W V D A P I G Y I G F T E E
- - - - - - - - Y V W V D A P I G Y I - - - - -
------------------------TATGTATGGGTTGATGCCCCCATTGGATATATC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
W A E K T G R D W K T Y W C G E N T R V T H F I
- - - - - - - - - - - - - - - - - - - - T H F I
------------------------------------------------------------ACCCATTTTATC
289290291292293294295296297298299300301302303304305306307308309310311312
G Q D I T Y H H C V F W P A M L H G A G Y G T P
G Q D I T Y H . C V F W P A M L H G . . Y - - P
GGACAGGACATTACCTATCAC---TGTGTCTTCTGGCCGGCCATGCTCCATGGT------TAT------CCC
313314315316317318319320321322323324325326327328329330331332333334335336
Y A V V A S G M L K I D D H K F S K S R G Y V V
. A V V A S - - - - - - - - K F S K S - - - - -
---GCAGTAGTTGCCTCA------------------------AAGTTCTCTAAGTCA---------------
337338339340341342343344345346347348349350351352353354355356357358359360
W T N E D Y L D Q G L P A D Y L R Y Y L L S Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S H T K E M N F S W Q L F Q E R I N N E V V N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L G N F I Y R S L H L S Q K Q F G G V P E G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E Q E I F D R I T E A I G Q V T G L V E A Y D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K G A V D A I L A L S A W G N T Y I Q S K E P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K L A K T D Q A A M A Q V M R N C L Q L A K A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T L L I E P V M P E R A G L I W S Q L G Q D S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I A N N G F S A G L E P L S P G P L P A P S I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F S K I D D K M T Q E L D K R L R D R I D A L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A E K K P K T P E I S I E E F A K V E M K T G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I L S A E Q V P K S T K L L K L Q V S I G D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R Q I V S G I A Q F H N P E E L V G K D V V V C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T N L K P A K I F G I E S N G M I L A A G D N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664
S L L R P E T P V P S G T K I R
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_met_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Y L I T T A L A Y T N G P L H L G H A R S T
- - - L I T T . L A Y T N G P L H L G H A R . T
---------CTAATAACAACT---TTAGCTTATACAAACGGCCCTCTACATTTAGGGCATGCAAGA---ACT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y I P A D I I Y K Y L K L R G E D V I H V G G T
Y I P A D I I Y K Y - - - - - - - - I H V G G T
TACATCCCAGCAGATATTATATATAAATAC------------------------ATCCACGTTGGAGGAACT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D N H G V P I T L T A E K E G K S P E E I V E K
D N H G - - - - - - - - - - - - - - - - - - E K
GATAACCACGGA------------------------------------------------------GAAAAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y H N E I K E D L D L L G V E F D A F G K T H S
Y H N E I K E D L D L L . . . . D A F G K T H S
TACCATAATGAGATTAAAGAAGATTTAGATTTGTTA------------GATGCATTTGGCAAAACTCACAGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q I H I E T A Q E F Y L K L K E N G Y I Y E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E Q F Y C P N C K K F L P D R Y V E G I C P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C G G E A R G D H C E V C G R H L E P F E L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P Y C V I C K G K P E I R K T K H H F F K L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L K K E L E E Y I K N A K E M P E H V K N M A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N W I K E L H D W D I S R D I S W G V P I P G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N Q V M Y V W L E A P I G Y I S F T K M L G E I
- - - - Y V W L E A P I G Y I - - - - - - - - -
------------TATGTTTGGTTAGAAGCCCCTATTGGCTATATC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W K K Y W L E K D T K I Y H F I G K D I T V H H
- - - - - - - - - - - - Y H F I G K D I T V H .
------------------------------------TATCACTTCATTGGAAAGGATATAACTGTTCAT---
289290291292293294295296297298299300301302303304305306307308309310311312
A V F W P G M L I A H G S F N L P T A V V S G G
A V F W P G M L I A . . . . . L P . A V V S G -
GCCGTTTTCTGGCCAGGAATGTTGATTGCT---------------TTACCA---GCAGTAGTTAGTGGA---
313314315316317318319320321322323324325326327328329330331332333334335336
Y L T L E G R K M S T S K R W V V W V K D F V K
- - - - - - - K M S T S - - - - - - - - - - - -
---------------------AAGATGAGCACAAGT------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N F D A D Y L R Y Y L I M S A P L F K D C D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F D D F K N K I N N E L I N I I G N F T H R V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T F T H R K F K K V P I V D E D R L K E E D K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L L K K C E E T L E A V D K N I R S F K F R D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L V N I L H L A I E G N S Y F Q K M E P W A V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D E E R L K E I L Y T C C K T V K T L V Y L L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P Y M P K K S L A L L E L M N E E L D L E L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N E L K K P K I I F K K I D N K K I E E M K K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L Y E N K K E E T K G G E K M E Q I D I S Y L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K I D L R V G E V V E A E D I P K S K K L L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
M V D L G D E K R Q I V S G I K G Y Y K P E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V G K K V I V I C N L K P A K L C G V L S E G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I L A A E D D E G N V S L L T V D K D I K A G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651
K V R
- - -
---------
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_met_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G K V L V T T A L A Y T N G P L H I G H V R S
- - - - L V T T . L A Y T N G P L H I G H V R .
------------CTCTCCGGGCTC---TTCCCTCTTACTCTCGTCGATAGTCAACAATGCGGGTTCGTC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T Y L P A D V Y T R F L K M R G I D A I H I G G
T Y L P A D V Y T R F - - - - - - - - I H I G G
AACGGCCAGGATCATCGCTTCCGACCGTACGCC------------------------GGCTAGTACAACCAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D N H G V P I A L Q A E L E G K D P E E I V E
T D N H G - - - - - - - - - - - - - - - - - - E
CTTACGTCCGACGAG------------------------------------------------------TCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K Y H E M I K E D L E R L N I H F D E F S C T C
K Y H E M I K E D L E R L . . . . D E F S . . .
GATATCGATCCGGAGCTTGATGAGTCGATCAGAGCCCTC------------TTCTTTGATCTT---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E F N P D H V D M T Q W F F K R L Y E A G Y I
R E F N - - - - - - - - - - - - - - - - - - - -
CAGGTCTAATCG------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E R E V E Q L Y C P E C E R P L P D R Y V E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V C P Y C G A E G A R G D H C E A C G R Y L E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V Q L E E P R C V I C G S K P E V R R T M H L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F K L S E F E E D L K K W L E S N D N L P K N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R N Y A I Q W V R E G L K D W D I V R D L D W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V P V P L E G Y E D K V F Y V W F D A P I G Y V
- - - - - - - - - - - - - Y V W F D A P I G Y V
---------------------------------------TATCTCCTGGTCAGTCTCGGCTTCGGGAACGTT
265266267268269270271272273274275276277278279280281282283284285286287288
T F T K Q Y C D R V G Q D W K D Y W F S E D T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I V H F I G K D I I V H H A L F W P A M L M G V
- V H F I G K D I I V H . A L F W P A M L M G .
---CACACGGTCCCGGAAGTCTCCCCACGAGAAATC---ATCCCTGGTGAGCGGGCTCACCACTATGAG---
313314315316317318319320321322323324325326327328329330331332333334335336
G A T L P Y T I V A G E Y L T L E G E K M S T S
. . . L P . T I V A G - - - - - - - - K M S T S
---------CAGATC---AGGGAACAGCTTGGT------------------------ACCACGACTTGTACT
337338339340341342343344345346347348349350351352353354355356357358359360
R G W V V W V K D F T K L F P A D L L R Y Y L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V S P L T R D A D F S W G D F R D R V N N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V A N L G N F V Y R T L S F I Y R F L D G N V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E A E T D Q E I V D K I K E T H Q R V T E H L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K F R F R E A L T E V L R L S K F G N E Y F Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
H E P W K L K D E D P E R C A E V L R G C A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V K A L A V M L A P F L P D S A E K I W Q S L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Y E D S V H D V D W E E A L E D V E T K E I P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P E P I F P K V T E E D L E K A K A L L P E E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G E S E G Q D D E Y V S L E E F N R L D L R V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K I K E A E R V E G S D R L I K L R I D I G D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T V T A V A G L Y P T Y E P E E L V G R K V V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L A N I Q P K E M F G V R S E A M I L A V G D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668
P A L L T I D E S K R E V E P G E R I R
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_met_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K V F I T C A L P Y A N G P T H L G H L R S
- - - - F I T C . L P Y A N G P T H L G H L R .
------------TTTATCACCTGC---CTTCCATATGCCAACGGCCCCACGCATCTCGGTCATCTGAGG---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T Y I P A D I Y A R Y R R L R G D D V L F V C A
T Y I P A D I Y A R Y - - - - - - - - L F V C A
ACCTACATACCTGCAGACATATATGCGAGGTAC------------------------CTCTTCGTCTGTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D E H G T P I A V K A E A E G R T P L E V A T
T D E H G - - - - - - - - - - - - - - - - - - T
ACCGATGAACACGGA------------------------------------------------------ACC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R Y H E M I R G D L E R C D I S F D S F T R T T
R Y H E M I R G D L E R C D - - - - S F T R T T
CGCTACCATGAAATGATAAGGGGGGACCTTGAGAGGTGTGAC------------AGTTTCACCAGGACCACA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D E L H H E I A Q K F F L K L Y E K G F I Y E K
D - - - - - - - - - - - - - - - - - - - - - - -
GAT---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D I K Q L Y C G D C Q R F L P D R Y V E G T C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G S E G A R G D H C E G C G R H L E P L Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E D P R C M V C G S E P E V R D S R H Y F F R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N Q F Q D E I R E W I E G S E M P S N V R N Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I Q W L R E G L K D W I L T R D M E W G V Q V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L E G N E G K I I Y V W G E A F L G Y I S S A A
- - - - - - - - - Y V W G E A F L G Y I - - - -
---------------------------TACGTGTGGGGTGAGGCCTTCCTTGGCTACATC------------
265266267268269270271272273274275276277278279280281282283284285286287288
A W S K K T G R D W R E Y W D S G A I H F I G K
- - - - - - - - - - - - - - - - - - I H F I G K
------------------------------------------------------ATCCACTTCATCGGAAAG
289290291292293294295296297298299300301302303304305306307308309310311312
D I I Y H H A I F W P A L L M A Y G C R T P A N
D I I Y H . A I F W P A L L M A Y - - - - P . N
GACATAATATACCAC---GCCATATTCTGGCCAGCCCTCCTGATGGCGTAT------------CCC---AAC
313314315316317318319320321322323324325326327328329330331332333334335336
I I A G E Y L S L E G Q K M S T S K N W V V W T
I I A G - - - - - - - - K M S T S - - - - - - -
ATAATAGCCGGG------------------------AAGATGTCCACCAGT---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S D F L E R F D R D L L R Y Y L T V N A P L T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D T D F S W D D F Q R R V N D E L A D V L G N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L H R T F S F T G R F F D G R V P A A G E L T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E D L E F L E S I R A A H D T V A E L L D K F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F R D A L M H I I K L A K R G N K Y F N D Q E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W K A V K E S P A R A S T C L H L C N L L A A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L G K L L R P F M P S A A G R I L S I M N L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E A W G F H E L R E G Q V I E R A K P L F S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T D E A I E E E K A K L I E E D D E V E T V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D D F T T M D I R V G V I R S A E R I E G S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L L K L I I D V G E R E M Q V V A G L A E K Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
P E D L V E R K I T V L V N L K P A K L F G V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S E G M V L A T G E S L N I L D P G D A E V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651
R I R
- - -
---------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_met_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I L V T A A L P Y S N G P I H L G H I A G A
- - - L V T A . L P Y S N G P I H L G H I A . A
---------CTAGTTACTGCG---TTGCCATATTCGAATGGGCCAATCCATTTGGGCCATATCGCT---GCT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y L P A D I F Y R F V K L K G Y N A L Y I C G S
Y L P A D I F Y R F - - - - - - - - L Y I C G S
TATCTGCCAGCAGATATATTTTATAGATTC------------------------TTGTACATATGTGGGTCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D Q Y G S P I E L N A I K L N I D P K D Y A S F
D Q Y G - - - - - - - - - - - - - - - - - - S F
GACCAATATGGA------------------------------------------------------TCATTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y R K I Q E E I F K K F N I K F D I Y S G T A E
Y R K I Q E E I F K K F . . . . D I Y S G T . E
TATAGAAAAATACAAGAAGAGATTTTCAAAAAATTT------------GATATATATTCAGGAACG---GAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S N I H P I I V K E F F L S L F S A G L L I E K
S - - - - - - - - - - - - - - - - - - - - - - -
TCC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E Q E L P Y D P K I K R F L P D R F V V G Q C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G Y E K A Y G D Q C E K C G R L L E P K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I N P K S A I T G E K V I F K K T R H L F F N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P K L K D K L K Q Y I E S K K D V W N D F T Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
W S L A L L D N F K E R A I T R D N K W G V K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P A K E M L E I L K K A L K E G K T P K D F G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L I D S T N E K D L E N H I K E Y E N K V L Y V
- - - - - - - - - - - - - - - - - - - - - - Y V
------------------------------------------------------------------TATGTA
289290291292293294295296297298299300301302303304305306307308309310311312
W F D A P I G Y I S F T F E T S P E Y R Y Y W D
W F D A P I G Y I - - - - - - - - - - - - - - -
TGGTTTGATGCGCCCATAGGGTATATA---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K E K P Y I V H F I G K D N I P F H T I F W P
- - - - - - - V H F I G K D N I P F . T I F W P
---------------------GTGCATTTTATTGGGAAAGACAATATTCCTTTC---ACAATATTTTGGCCT
337338339340341342343344345346347348349350351352353354355356357358359360
A L I I G R N L G Y K N I N H I L D F D I A L P
A L I I G . . . . Y - - - - - - - - - - - - - P
GCATTAATAATTGGG------------TAT---------------------------------------CCT
361362363364365366367368369370371372373374375376377378379380381382383384
Y Q V F G N P Y L N Y Y G K K F S K S K R W G V
. Q V F G N - - - - - - - - K F S K S - - - - -
---CAAGTATTTGGTAAT------------------------AAATTCTCAAAAAGC---------------
385386387388389390391392393394395396397398399400401402403404405406407408
F L D N I D K I D I D I D Y F R F Y L A Y I H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V S K D M S F E W D Q F K E V I N K E L V D N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G N F I H R V L T F I Y N R F N G I P P K I E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L D D K D K E L L D K I K Q L P E K V F N F I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K G E I G N A L R E I V N T S N L A N K Y F Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K E P W K T N D P N T I A I A F E A V K T F I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L L Y P F I P E K A K L L A S I A N I D I K W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F N Q K V E K I N K P F I V F H K L S D N Q I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
M A K Q I L T N P K E Y D L G K K K V I G V L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Y E D E L Y K I E L E C D D N P W V C L K R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D K R K I K Y I Y D T V K G D V P P H I I D G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T Y I Y L L P A L E K P N L E K A E E E Y G L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S Y L D F A K L D M R V G K I I D V Q D H P N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D K L Y I I K V S L G N K Q K T L V G G L K Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y K K E E L I G K Y V V L I N N L K P K Q L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I T S E G M L L A A D D G K E V A L L M P D K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776
I S L G S K V R
- - - - - - - -
------------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/met_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K L V T C G L P Y A N G K A H V G H L R T Y V
- - L V T C . L P Y A N G K A H V G H L R T Y V
------CTCGTCACCTGC---TTACCTTACGCTAACGGCAAGGCTCATGTCGGGCACCTCAGGACGTACGTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A D V Y V R Y L R M A G E E V V F V C G S D C
P A D V Y V R Y - - - - - - - - V F V C G S D C
CCCGCTGACGTTTACGTCCGATAT------------------------GTTTTCGTTTGCGGGAGCGACTGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H G T P I V V N A E Q Q G L S P K E L V D I Y H
H G - - - - - - - - - - - - - - - - - - D I Y H
CACGGC------------------------------------------------------GATATATATCAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E H F I K I F D A L N I K F D F Y G R T D S D Y
E H F I K I F D A L . . . . D F Y G R T D S - -
GAGCACTTCATCAAGATTTTTGACGCTTTG------------GACTTCTACGGCAGAACGGACAGC------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H H H R T T E I V K R L I E K G Y V Y P K E I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L A Y C P K C Q R F L P D R Y V E G I C P Y C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L A R G D E C D Q G C G R H L E P G E I K E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R C K I C G S K A E F R S Q R H Y F F K L T E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q D F L E D Y L S K L K G T E N A L N Y A R N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K N L R D W C I T R N L E W G V R F P G E P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L V V Y V W V D A P I G Y I S F T E R A C E E K
- - - Y V W V D A P I G Y I - - - - - - - - - -
---------TACGTCTGGGTTGATGCCCCCATAGGCTACATC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G C D W R K I W I D G D A E I I H F I G L D I V
- - - - - - - - - - - - - - - I H F I G L D I V
---------------------------------------------ATCCACTTTATAGGCCTCGACATCGTT
289290291292293294295296297298299300301302303304305306307308309310311312
Y H H C I F W P A M L K G A D Y A L P S A V V A
Y H . C I F W P A M L K G . . Y - - P . A V V A
TACCAC---TGCATTTTCTGGCCTGCGATGCTGAAAGGA------TAC------CCT---GCGGTGGTGGCG
313314315316317318319320321322323324325326327328329330331332333334335336
S G M V K V E G K T F S K S R G Y V V W V E E D
S - - - - - - - - T F S K S - - - - - - - - - -
AGC------------------------ACCTTCTCGAAGTCG------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y L K S G L S P D Y L R Y Y I V N Y T S H Q K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N F S W E V F R E K V N N E V I A T L G N F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y R V L L F A W K N F G E V R M E G V D E E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E K I R E T E Q K I L S A L E E W E F K A A S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A F M E L A T Y G N V Y F Q N A K P W E L I K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D K E A A R R A V A S C L Q L A K A L I I F A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P V M P E S M E R M A K A I G L D L E N V R L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D A Y K V D E V M K L S K P E V P F A K V E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V I E K L Q K V M E K R F R G E E G E K M E Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E E I S I E D F Q K L D I R I G R V L K A E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K K S K K L I K L I I D I G D E Q R Q I V S G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A E D Y T P E E L E G K L V V V L A N L K P A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F M G V E S R G M I L A A E K D G K A I L L T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659
E K E V E P G T R V C
- - - - - - - - - - -
---------------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_met_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A R W V V T S A W P Y V N N V P H L G N L I G
- - - - V V T S . W P Y V N N V P H L G N L I .
------------TAGTGGAGGCCT---CTCCATGACGCGTTTTCTGGCTTCTGCTAGTAGTTCTTTAAC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S I L S A D V F A R Y L R L R G E D V V F V S G
S I L S A D V F A R Y - - - - - - - - V F V S G
CTCGGGGAAGTCGCTGGGCAGCTTGCGGAAGAG------------------------GCCCGGCTTGAGCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D E H G T P I E I E A I R R G V E P K Q L T D
S D E H G - - - - - - - - - - - - - - - - - - D
TGGCTTAGATGCTTC------------------------------------------------------CCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A H E Y V S K L F Q E Y R I S F D N Y T R T E
Q A H E Y V S K L F Q E Y . . . . D N Y T R T E
TTCGGCGGCGTCTGGTGTGAAGGGTGCTAGAAGTACTGC------------GGCGTTGGCGGCCACATACAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S P V H K N F V Q E F M M K L Y Q N G Y I F E Q
S - - - - - - - - - - - - - - - - - - - - - - -
AGT---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D D V L P Y C P R D R M F L P D R F V V G T C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G F E K A Y G D Q C D N C G R L L H P T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K N P R C A I C G G P V E F R K S R H W F F D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P K L Q E R L L R W L Q E S R L P P N V K N Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L N W V K E G L K P R S V T R D N K W G I P A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F P G A E G K T I Y V W F D A L L G Y V S A T K
- - - - - - - - - Y V W F D A L L G Y V - - - -
---------------------------CTCTGTCGAGGATATGTACCATGGCAGTGTATA------------
265266267268269270271272273274275276277278279280281282283284285286287288
E Y G I K K K S D D E L W K R Y W F D K E T R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V Y F I G K D N I P F H A I I L P A M F M A S G
V Y F I G K D N I P F . A I I L P A M F M A . .
AGTCTCCTTATCAAACCAATAACGCTTCCAAAG---ATCGTCACTCTTTTTCTTTATACCATATTC------
313314315316317318319320321322323324325326327328329330331332333334335336
D P Y T L P W Y I S S T E Y L M Y E G E Q F S K
. . Y - - P . Y I S S T - - - - - - - - Q F S K
------TAC------TAG---CGCATCAAACCAGAC------------------------CGGGAAGGGTGC
337338339340341342343344345346347348349350351352353354355356357358359360
S R R W G I W M D E A L E L L P A D Y W R F T L
S - - - - - - - - - - - - - - - - - - - - - - -
TGG---------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I K M R P E T K D T N F T W S E F T R I V N S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M N D D I G N F V H R V L K F I K S R F G N K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P E P S N M K E L D K E Y L D Y I L L A P N R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G S Y I E S F R L K Q A L E E V V E L A R R G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q Y L N A K A P W E K I K T D P P D A A T T M Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V A A N A V A T L A V L L A P F T P D A A E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
W R M L N M E G S V H R S G R W L E A S K P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K P G H V L G E P E P L F R K L P S D F P E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573
K E L L A E A R K R V M E K R P P L L R W
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_met_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V R Y M V T S A L P Y A N G P I H A G H L A G
- - - - M V T S . L P Y A N G P I H A G H L A .
------------TGCTCCCAACTT---CTCTTTGTCGGGCATCAGTAAAGCAACGTTCTCGCCATCGTC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A Y L P A D I F V R Y L R L K G E D V V F I C G
A Y L P A D I F V R Y - - - - - - - - V F I C G
GGCCAGGAGCATTCCCTGGCTTTCAACCCCTCT------------------------AACAATAATGACGTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D E H G T P I S F R A L K E G R S P R E I V D
T D E H G - - - - - - - - - - - - - - - - - - D
CTTGTTGAGCAATTC------------------------------------------------------CAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E F H E H I K I T F Q R A K I S F D F F G R T E
E F H E H I K I T F Q R A . . . . D F F G R T E
GTCAACTTTAACTATATATAGCTTGTCTGCATTTGGATG------------GATTATCTTCCCTACCCTAAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P I H Y K L S Q Q F F L K A Y E N G H L V K K
L - - - - - - - - - - - - - - - - - - - - - - -
GTC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V T K Q A Y C E H D K M F L P D R F V I G T C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F C G A E N Q R G D Q C E V C G R P L T P E I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I N P R C A L C G R P I S F R E S A H Y Y I K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q D F A E K L K R W I E N Q P W K P N V K N M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L K W I E E G L E E R A I T R D L N W G I P V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L D E E D M K N K V L Y V W F E A P I G Y I S I
- - - - - - - - - - - Y V W F E A P I G Y I - -
---------------------------------TTTATGGTCGAAGTACTTATTACCGAATGATGC------
265266267268269270271272273274275276277278279280281282283284285286287288
T M E Y F K R L G K P N E W K K Y W L N I D S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T R V I H F I G K D N I P F H A I F W P A F L M
- - - I H F I G K D N I P F . A I F W P A F L M
---------GAGGGCTTGTCTATCTAGCTCATCGAGTTCTCC---CTCTGGGACTATCCCATCAAAGTACCT
313314315316317318319320321322323324325326327328329330331332333334335336
A Y G K Y K D E E V E A E W N L P Y D I P A N E
A Y - - - - - - - - - - - - - - P . D I P A N -
GTTCAC------------------------------------------GAG---CTCGTTTATCCTAGT---
337338339340341342343344345346347348349350351352353354355356357358359360
Y L T L E G K K F S T S R N W A I W V H E F L D
- - - - - - - K F S T S - - - - - - - - - - - -
---------------------TGAATCTCTAGTTTC------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V F P A D Y L R Y Y L T T I M P E T R D S D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F A E F K T R I N E E L V N N L G N F V H R A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T F V N R Y F D G I V P E R G E L D E L D R Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L E E I E K A F E E V G E L I M N Y R F K D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K R V M E L A S F G N K Y F D H K Q P W K T A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E D R A R T G T T V N I S L Q I V K A L G I L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E P F L P D A S E K I W H L L N L D E V K K W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F K E L P A G H R V R K A E I L F K K V T D E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I I Y F I L N Y M G R N N P E G A K M L L E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y K R E D V I K V A K E K F G E E S K I I L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I Y K D I K L E E G K E E K E M E Y V K F E D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A K L D L R V G K I I E V K D H P N A D K L Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V K V D L G K E V R T L V A G L K K Y Y K P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L L N K Y V I I V A N L E P K K L R G V E S Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
M L L A A D D G E N V A L L M P D K E V K L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723
K V R
- - -
---------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_met_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D E T R F D R I L V T A A L P Y A N G P I H I
- - - - - - - - - L V T A . L P Y A N G P I H I
---------------------------CTGGTGACGGCG---CTGCCCTACGCGAACGGTCCCATTCACATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G H L A G A Y L P A D L Y C R Y Q R L K G R D V
G H L A . A Y L P A D L Y C R Y - - - - - - - -
GGCCACCTGGCC---GCCTACCTGCCGGCCGATCTGTACTGCCGCTAC------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F I C G S D E L G V A I L M R A L E E G T T P
L F I C G S D E L G - - - - - - - - - - - - - -
CTGTTCATCTGCGGATCGGACGAACTGGGT------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A I V D R Y H P M I R D S F A R F G M S F D Y
- - - - D R Y H P M I R D S F A R F . . . . D Y
------------GATCGTTATCATCCGATGATCCGCGACAGCTTCGCCCGCTTC------------GACTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y G R T T S P V H F E T S Q D F F R W L D E K G
Y G R T T S - - - - - - - - - - - - - - - - - -
TACGGGCGCACGACCTCG------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V F K L K T E K Q L Y D P E A G I F L A D R F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R G T C P I C G Y E D A Y G D Q C E R C G S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S P T D L I N P R S V L S N A T P E L R E T T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W Y L P L G D F Q P K L E A W I A T H P E W K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N V L G Q V R S W L Q Q G L R D R A V T R D I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W G V P V P E D V A R R H G V P A E G K V L Y V
- - - - - - - - - - - - - - - - - - - - - - Y V
------------------------------------------------------------------TACGTC
265266267268269270271272273274275276277278279280281282283284285286287288
W F D A P I G Y I S A T R E W A Q Q Q G D P E A
W F D A P I G Y I - - - - - - - - - - - - - - -
TGGTTCGACGCCCCCATCGGGTACATC---------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
W R R Y W Q D E R T R L I H F I G K D N I V F H
- - - - - - - - - - - - I H F I G K D N I V F .
------------------------------------ATTCATTTCATCGGAAAGGACAACATCGTCTTC---
313314315316317318319320321322323324325326327328329330331332333334335336
C L M F P A M L M A H G E F V L P D N V P A N E
C L M F P A M L M A H - - - - - P . N V P A N -
TGCCTGATGTTTCCCGCCATGCTCATGGCGCAT---------------CCC---AACGTGCCGGCCAAC---
337338339340341342343344345346347348349350351352353354355356357358359360
F L N L E G H K L S T S R G W A V W L H E Y L E
- - - - - - - K L S T S - - - - - - - - - - - -
---------------------AAGCTCTCGACCAGC------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E F P P D L L R Y A L A T M L P E T R D A D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
W K E F Q Q R V N A E L A D I L G N F V H R T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T F A Q R F A E G R V P P L R N A R P V D E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L R E L A T F P E R I G S A Y E Q F R F R E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q E T M N L A R L G N K Y F N D T E P W H T R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T D P Q A C A N T I H V S L Q I C A S L S I L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E P V L P F A A A R L R E M L R L E G V R P S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P D G E G A L G W D D A A R P L L P E G H E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R P E I L F T K I E D E V I E R Q I A R L E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A Q Q A A A K T D G P P Y A P L K P E I V Y D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
F D R L D L R V G R V E K A E R V P K S K K L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R L E V D L G F E K R Q I L A G V A E Q M A P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D L E G R R V V V V A N L K P R K M M G L E S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G M L L M A E D R E G R L V P V T A E S E P G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699
V V R
- - -
---------
Class I
Archaea/Staphylothermus marinus/Smarinus_met_aa
Archaea/Staphylothermus marinus/Smarinus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M S I F Y I T T P I Y Y P N A P P H I G H A Y
- - - - - Y I T T . I Y Y P N A P P H I G H A Y
---------------TACATAACAACA---ATATATTATCCAAACGCACCACCCCATATAGGGCATGCTTAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T T V F A D V L A R Y H R L I G D E V F F M T G
T T V F A D V L A R Y - - - - - - - - F F M T G
ACAACGGTTTTCGCCGATGTCTTGGCGAGATAT------------------------TTCTTTATGACTGGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N D E H G L K L Q R A A E K K G V H P K Q F V D
N D E H G - - - - - - - - - - - - - - - - - - D
AATGATGAGCATGGA------------------------------------------------------GAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E M A D V Y K K Y W E L L D I S Y D Y F I R T T
E M A D V Y K K Y W E L L D - - - - Y F I R T T
GAAATGGCTGATGTTTATAAGAAGTATTGGGAATTGCTTGAT------------TACTTTATACGTACAACG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D D Y H E K V V K T A I Q K L Y D K G L V Y K A
D - - - - - - - - - - - - - - - - - - - - - - -
GAT---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S Y A G W Y C V D C E K F Y S P G E Y I E I N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K P H C P I H K K P L E W L E E E T Y Y F K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E F E D F I I D V L K N K D I V Y P R S Y A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V L G K V E K E G L R D V S I A R P K E R V W W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G I E V P F D K N Y T V Y V W F D A L L N Y I S
- - - - - - - - - - - - Y V W F D A L L N Y I -
------------------------------------TATGTATGGTTCGACGCGCTCCTAAACTATATT---
241242243244245246247248249250251252253254255256257258259260261262263264
G I G Y L E D M D R F N K Y W P N V H H V I G K
- - - - - - - - - - - - - - - - - - H H V I G K
------------------------------------------------------CACCATGTTATCGGAAAA
265266267268269270271272273274275276277278279280281282283284285286287288
D I L W F H T V V W F S I L K A L D I E L P K K
D I L W F . T V V W F S I L K A L - - - - P K .
GATATCTTATGGTTC---ACAGTAGTATGGTTTTCGATACTTAAAGCACTA------------CCAAAG---
289290291292293294295296297298299300301302303304305306307308309310311312
L L V H A F L I N R G L K I G K S A G N V I A I
L L V H - - - - - - - - K I G K S - - - - - - -
CTGCTGGTTCAT------------------------AAAATAGGTAAGAGT---------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E D L I D R Y Q D S D G V R Y I L M R V F N M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K D V D V S T E L F D S I Y N S E L A D T L G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L V R R I G V L A K K K L G G I V Y K R E V D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L S T S I V E T L N K Y N E Y M E A Y D V S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A I Q V V M D L L R K A N A Y V N L T R P W E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
M D P G K E L Y S L L E T I R A S T T M L Y P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I P K A A S K V S K A F G Y R I G N P S E Y V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500
G E I E R Y N I V D A P I L F R K I K Q
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_met_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A R W V V A S A W P Y V N N V P H L G N L I G
- - - - V V A S . W P Y V N N V P H L G N L I .
------------GTAGTAGCGTCT---TGGCCCTACGTCAACAACGTGCCGCACCTAGGCAACCTTATC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V L S A D V F A R Y L R L R G E D V V F V S G
S V L S A D V F A R Y - - - - - - - - V F V S G
TCAGTGCTCTCTGCCGACGTGTTCGCCCGCTAT------------------------GTGTTCGTGAGCGGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D E H G T P I E I E A I K R G V H P R Q L T D
S D E H G - - - - - - - - - - - - - - - - - - D
AGCGATGAGCACGGT------------------------------------------------------GAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A H E Y V S R L F R E F R I S F D N Y T R T E
Q A H E Y V S R L F R E F . . . . D N Y T R T E
CAGGCCCACGAGTACGTGTCCAGGCTCTTCAGGGAGTTC------------GACAACTACACACGCACCGAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S P V H R E F V R E F M M K L Y E N G Y I F E Q
S - - - - - - - - - - - - - - - - - - - - - - -
AGC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D D I L P Y C P R D K M F L P D R F V V G T C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y C G Y P Y A H G D Q C D N C G R L L H P T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K N P R C A I C G G P V E F R K S K H W F F D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S K L Q D R L L K W L E E S N L P P N V K N Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L N W V R E G L K P R S V T R D N K W G I P A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F P G A E G K T I Y V W F D A L L G Y I S A T K
- - - - - - - - - Y V W F D A L L G Y I - - - -
---------------------------TATGTATGGTTTGACGCTCTCCTTGGCTACATA------------
265266267268269270271272273274275276277278279280281282283284285286287288
E Y G L K K G D E S L W K R Y W F D K E T R T V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTA
289290291292293294295296297298299300301302303304305306307308309310311312
Y F I G K D N I P F H A I I F P A M L M A S G D
Y F I G K D N I P F . A I I F P A M L M A . . .
TACTTCATAGGCAAGGACAACATACCCTTC---GCCATAATATTCCCGGCGATGCTCATGGCC---------
313314315316317318319320321322323324325326327328329330331332333334335336
P Y T L P W Y I A S T E Y L M Y E G E Q F S K S
. . . L P . Y I A S T - - - - - - - - Q F S K S
---------CTCCCA---TATATAGCCTCGACC------------------------CAGTTCTCCAAGAGT
337338339340341342343344345346347348349350351352353354355356357358359360
R R W G I W I D E A L E I L P A D Y W R F A L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K M R P E T R D T N F T W K E F T R I V N S D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N D D I G N F V H R V L K F I K S R F G G R V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E P G E M K E L D R D Y L D Y T L K A P E R V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S Y L D S F R L K Q A L D E V V E L A R H G N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Y L N A K A P W D K I K T E P S D A A T T M Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A A N A V A T L A V M L A P F T P D A A E R L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R M L N M R G S V H E P G R W R E A S R P L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P G H E I G E P E P L F R K L A N D F P E K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572
E I L E E A R K K V M E K R P P L L R W
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_met_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P E H I L V A V A W P Y A N G P R H I G H V A
- - - - - L V A V . W P Y A N G P R H I G H V A
---------------TTGCATCCGCGC---CTCCTCTTCGATCACCTTTTCATCGAGCTTCTTGAAGAGCGG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G F G V P A D I F A R Y H R L R G N R V L M V S
. F G V P A D I F A R Y - - - - - - - - L M V S
---CGGCTGGCGTAATACCTGCCCCACCGGTAACAC------------------------CCGATCGTAGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T D E H G T P I T L V A D K E G T T P Q A I A
G T D E H G - - - - - - - - - - - - - - - - - -
ACCGGTCAAGACCCGATG------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D R Y N K I I G D D L Y N L G L S Y D T F T R T
D R Y N K I I G D D L Y N L . . . . D T F T R T
GCCGTTATAGCCCAAGTACTCGTGCAGGCGCTGGCTGGAGAA------------CGTAAAGATGATCTTGAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T T A N H Y A V T Q D I F R T L Y E R G Y I I R
T T - - - - - - - - - - - - - - - - - - - - - -
CGTATC------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q E T L G A F S A T T G R T L P D R Y I E G T C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P L C G Y D E A R G D Q C D N C G S Q L D P T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I N P R S K V D G Q P P V F K P T E H F F L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L P A F A E Q L H D W I N R Q D H W R P N V R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F S L N F L K D L K P R A I T R D L E W G V P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P L P E Y A N R D D K K I Y V W F D A V I G Y L
- - - - - - - - - - - - - Y V W F D A V I G Y L
---------------------------------------CTCCATCGTCAAAAACTCACTCGAGACGACGTT
265266267268269270271272273274275276277278279280281282283284285286287288
S A S I E W A Q N S G Q P D A W R E W W Q N P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A R H F Y F M G K D N I V F H T V I W P A M L L
- - - F Y F M G K D N I V F . T V I W P A M L L
---------CATCGCCGGCCAGATGACGGTATGGAAAACAAT---GTCTTTGCCCATGAAGTAAAAGTGACG
313314315316317318319320321322323324325326327328329330331332333334335336
G Y G A G G Q F G A D P G G K Y D G I P L Q L P
G Y - - - - - - - - - - - - - - - - - - - - - P
CGCATC---------------------------------------------------------------GGC
337338339340341342343344345346347348349350351352353354355356357358359360
Y N V V S S E F L T M E G K K F S S S R G I V I
. N V V S S - - - - - - - - K F S S S - - - - -
---GAGATAACCGATGAC------------------------TTTGTCGTCGCGGTT---------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y V N D F L S R Y D A D A L R Y F L T I A G P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N Q D T D F T W A E F V R R N N D E L V A T W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N L V N R T L S N V Y K N F G S V P Q P G P L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P V D E Q V L A E V T G G I E T V G E L L A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F K A A L A E A M R L A A Q V N I Y L S E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P W K V I K S D H E R A A T I W Y V A L R C V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T L K I I F T P F L P F S S Q R L H E Y L G Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G Y I A G P L T F R E V T E A N G R T H R V L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G D Y D R W V G R W E P S V L P V G Q V L R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Q P L F K K L D E K V I E E E L A R M Q S R L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_met_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Y I T T P I Y Y V N D V P H L G H A Y T T I
- - Y I T T P I Y Y V N D V . H L G H A Y T T I
------CACTAAAGAGCCGTTTTGCACAAGTTGTTCAGGGGC---TAAAACAAGTTTATCTCCGCTTTTTGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I A D T L A R F Y R L Q G H E T R F L T G T D E
I A D T L A R F - - - - - - - - R F L T G T D E
AGAAAGTATCATACCATCGCTTTC------------------------AAGATTGCTTATAACGCAAACTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H G Q K I E E A A K L R N S T P Q E Y A D K I S
H G - - - - - - - - - - - - - - - - - - D K I S
TTTACC------------------------------------------------------TTCTTTATCGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F E F K K L W D E F E I T Y D I Y A R T T D T R
F E F K K L W D E F . . . . D I Y A R T T D - -
AAGTTCGAGTTGAAATTTTAAAAGTTTTTC------------ATTTTGACAATCAAGTACCTTAGC------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H I E F I K A M F L K M W Q K G D I Y K D E Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G H Y C I S C E S F F T Q S Q L I N D C S C P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C G K Q T R I L K E E S Y F F K L S K Y Q D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L Q W Y E E K D P I L P K N K K N E L I N F V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N G L K D L S I T R T S F D W G I K L P Q E I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D D K H I I Y V W L D A L F I Y V S S L D F Q N
- - - - - - Y V W L D A L F I Y V - - - - - - -
------------------TTCTTCTAAATAACGATTACACTGTAAGTTTTC---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K G E N A K F W P A H V H L V G K D I L R F H A
- - - - - - - - - - - V H L V G K D I L R F . A
---------------------------------GTAAAATTTTAAAACACCTTCTTTTGAAATATT---TTG
265266267268269270271272273274275276277278279280281282283284285286287288
I Y W P A F L M S V D L P L P K F I G A H G W W
I Y W P A F L M S V - - - - P . F I G A H - - -
AGAATATTTTGTACTCATACCTATAATGCG------------TCC---TTCATTGCTAAGCTC---------
289290291292293294295296297298299300301302303304305306307308309310311312
T K E G E K M S K S K G N V V K P K E V V D A Y
- - - - - K M S K S - - - - - - - - - - - - - -
---------------ATTTTCGCTAAAATC------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G S E A F R Y F L L R E V P F G N D G D F S E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M L I N R I N A E L S N E F G N L L N R I I G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S T K Y S Q G N I S K E G V L K F Y N A E L N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A K E H L N L A V E F L E N L Q C N R Y L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F K A L S V A N L A I S K Y E P W S L I K E N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
H E Q A N A L V A L C A N I L A K T S L L L S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T L P K S S Q K V A L A L N F E I S S A N Y T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M I L D N E L L D F K A N P C E A L F P K V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A L L K Q E I K E E P K K E E S P K I K I D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A K I E I K V A K V L D C Q N I E G S E K L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F Q L E L D D K E I R Q V L S G I A K Y Y K A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D L I G K Q V C V I S N L K K A K I F G H E S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G M I L S A K S G D K L V L I A P E Q L V Q N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628
S L V G
- - - -
------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_met_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S S D R E K P G V F Y V T T P I Y Y V N D R P
- - - - - - - - - - - Y V T T . I Y Y V N D R P
---------------------------------TACGTCACCACG---ATCTACTACGTGAACGACAGGCCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H L G H V Y T T L V A D V A A R F H R L R G D D
H L G H V Y T T L V A D V A A R F - - - - - - -
CACCTCGGGCACGTCTACACGACGCTGGTCGCCGACGTGGCCGCCCGCTTC---------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F F L T G V D E H A A K V S D R A A E N G M G
- F F L T G V D E H A - - - - - - - - - - - - -
---TTCTTCCTCACCGGCGTGGACGAGCACGCG---------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P Q A W A D R N A L A F R E T F D K L R L T F D
- - - - - D R N A L A F R E T F D K L . . . . D
---------------GACCGCAACGCGCTGGCGTTCCGGGAGACCTTCGACAAGCTG------------GAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D F V R T S S D R H K E R V T A Y V T E L L A S
D F V R T S S - - - - - - - - - - - - - - - - -
GACTTCGTCCGCACCAGCAGC---------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G D V Y E G R Y E G W Y D A G Q E E Y V P E N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A E A Q G F R S E V N G K P L V K K S E T N Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F R L S A Y R E R V L A H I E A H P G F V Q P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A R R N E V V N R I K E A Q D V P I S R T G A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L G A D G R R W G I P V P G D A E Q T I Y V W I
- - - - - - - - - - - - - - - - - - - - Y V W I
------------------------------------------------------------TACGTGTGGATC
241242243244245246247248249250251252253254255256257258259260261262263264
D A L F N Y L T Y A D D E H R R R Y W Q A G A T
D A L F N Y L - - - - - - - - - - - - - - - - T
GACGCGCTCTTCAACTACCTC------------------------------------------------ACG
265266267268269270271272273274275276277278279280281282283284285286287288
H Y I A K D I L W F H A A I W P A L L L A L R E
H Y I A K D I L W F . A A I W P A L L L A L - -
CACTACATCGCCAAGGACATCCTCTGGTTC---GCGGCGATCTGGCCGGCCTTGCTGCTTGCCCTT------
289290291292293294295296297298299300301302303304305306307308309310311312
R P G Y G W V N L P Q T V F T H S Y W V S D S G
- - - - - - - - - P . T V F T H - - - - - - - -
---------------------------CCC---ACGGTCTTCACGCAC------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K M S K S L G N F L D P E A I D R A V E A Y G
- K M S K S - - - - - - - - - - - - - - - - - -
---AAGATGAGCAAGAGC------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I D A L R Y F L A T K G P L G T T D A S F S A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L F D T V Y H S D L A N T F G N S A S R V T N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L V R Y C G G A V P C A A D R G G G L A E E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R A V A A A T A A Y D A G D L E G A A E A A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L V R R V D A Y V E A T Q P F K M W K A E E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A E V G P I L A R C V E A L R V A S V L L W P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T P H K V E D F W S R I G C G A Q A E A L A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G R G D L A A W A A W G G L A A G M A V Q K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539
A L F P R V E P A P V
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_met_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P S T F A L T T P L Y Y V N D V P H I G S A Y
- - - - - A L T T . L Y Y V N D V P H I G S A Y
---------------GCCCTGACGACT---CTCTACTACGTCAACGATGTGCCGCACATCGGCAGTGCCTAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T T I A A D A I A R F H R L Q G D R V L M I T G
T T I A A D A I A R F - - - - - - - - L M I T G
ACCACGATCGCGGCGGATGCGATCGCTCGTTTC------------------------TTGATGATCACCGGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D E H G Q K I Q R T A E K N G K P P Q E H C N
S D E H G - - - - - - - - - - - - - - - - - - N
AGCGACGAGCATGGC------------------------------------------------------AAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I V A R F Q D L W Q L L N I R Y D R F S R T T
A I V A R F Q D L W Q L L . . . . D R F S R T T
GCGATCGTGGCTCGCTTCCAAGACCTCTGGCAGCTGCTC------------GACCGCTTCAGCCGCACCACC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D P R H Q A I V E V F Y R R V E A Q G D I Y V G
D - - - - - - - - - - - - - - - - - - - - - - -
GAT---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R Q Q G W Y C V A C E E F K E E R D L L E D K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C P I H T N Q A V E W R D E E N Y F F R L S R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q E A L E A H Y A A N P D F I Q P E S R R N E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L S F V E R G L Q D F S I S R V N L E W G F A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P D N P K H T L Y V W F D A L L G Y V T A L L D
- - - - - - - - Y V W F D A L L G Y V - - - - -
------------------------TACGTCTGGTTTGATGCGCTGCTGGGTTATGTG---------------
241242243244245246247248249250251252253254255256257258259260261262263264
P D A E P T L E N A L S Q W W P I N L H L I G K
- - - - - - - - - - - - - - - - - - L H L I G K
------------------------------------------------------CTGCACCTGATCGGCAAA
265266267268269270271272273274275276277278279280281282283284285286287288
D I L R F H A V Y W P A M L L S A G L P L P D R
D I L R F . A V Y W P A M L L S A - - - - P . R
GACATTCTGCGTTTC---GCGGTCTACTGGCCGGCGATGTTGCTTTCGGCA------------CCC---CGC
289290291292293294295296297298299300301302303304305306307308309310311312
V F G H G F L T K D G L K M G K S L G N T L D P
V F G H - - - - - - - - K M G K S - - - - - - -
GTCTTTGGTCAT------------------------AAGATGGGCAAGAGT---------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F D L V D R F G S D A V R Y Y F L K E I E F G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D G D Y Q E T R F V N V V N A D L A N D L G N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N R T L S M A K R Y C Q L Q I P L G S T A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A D N P L R Q Q G E A L T D S V K S A Y D R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F S E A C G Q I L A L V Q A G N R Y L D Q E A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W T R F K Q G E Q A K V E E I L Y T V L E S V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L A A Y W L S P L V P G I S Q E I Y R Q L G L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A D F N D P A I A Q Q L D P E S H G H W G F L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525
A A Q Q F L D P S P V F R S L E L A P A D
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_met_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K N I L V A V A W P Y A S G A R H L G H V A
- - - - - L V A V . W P Y A S G A R H L G H V A
---------------TTCGAGCTTTTT---CAGCACGCTTGGGGCGGCCAACTCACGACCTGCGGGCAGATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G F G V P S D V F A R Y Q R L V G N N V L M V S
. F G V P S D V F A R Y - - - - - - - - L M V S
---CCATTCCCAGCGGCCAATCCAAGTACTAGGTTC------------------------CTGGCTTTCTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T D D H G T P I T V R A D R E G K T P R E V T
G T D D H G - - - - - - - - - - - - - - - - - -
GCGTTCTTCAAACAGCAA------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F Y N A E I R N N L R D L G L S Y D L F T R T
D F Y N A E I R N N L R D L . . . . D L F T R T
GAAGGGCAAAAATGGCGTAAACAAGGTGCGCAAATTATTAAT------------AACATACAAAATCGTGCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S T E N H Y Q I T Q A F F T R L Q E K G Y I F A
S T - - - - - - - - - - - - - - - - - - - - - -
ACCGCG------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q E M I G T Y S E A D K R F L P D R Y V E G T C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P H C G Y T K A R G D Q C D N C G K Q L D P V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I E P R S T L S G A T P V F K P T T H F F L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L P A F V E R L R E W I E S Q N H W R P N V K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F S L G L L D D V P A R A I T R D L T W G V P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P V E G D E F D S K R I Y V W F D A V I G Y L S
- - - - - - - - - - - - Y V W F D A V I G Y L -
------------------------------------GACGACCTCATAGGGCAATTCCAATTCGCCATG---
265266267268269270271272273274275276277278279280281282283284285286287288
A A V E W S I K V G R P E A W R D W W L N S D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R H Y Y F M G K D N I V F H S V I W P A M L I G
- - Y Y F M G K D N I V F . S V I W P A M L I G
------GTTGAGCCACCAATCGCGCCAAGCCTCAGGCCG---AACCTTGATCGACCATTCAACTGCTGCTGA
313314315316317318319320321322323324325326327328329330331332333334335336
H G E L E L P Y E V V S S E F L T L A G G E K I
H - - - - - P . E V V S S - - - - - - - - - K I
AAG---------------ATC---CCACACATAAATTCG---------------------------CGGAAT
337338339340341342343344345346347348349350351352353354355356357358359360
S S S R A E G N S I P F V G E F L A Q Y D P D P
S S S - - - - - - - - - - - - - - - - - - - - -
TGGCACGCC---------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L R Y F L V I A G P E T S D T E W S L G E F I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R N N E E L V A T W G N L V N R V L S I T H K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F G H V P T P Q A L T A E D E A A L A T V R A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F E T V G K E L E Q A H F K A G L I A T M A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R S V N E Y L A S Q E P W K V L K T D R E R G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T I L Y V A L Q A I N N L R T L F T P F L P F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S Q K L H E L L G N E G Y L A G P L L F E E R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E S Q H S H E V L T C E P S T W I G R W E W S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574
L P A G R E L A A P S V L F K K L E L P T E
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_met_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K E T F Y I T T P I Y Y P S G N L H I G H A
- - - - - - Y I T T . I Y Y P S G N L H I G H A
------------------TATATAACAACC---ATATACTATCCTAGTGGGAATTTACATATAGGACATGCA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y S T V A G D V I A R Y K R M Q G Y D V R Y L T
Y S T V A G D V I A R Y - - - - - - - - R Y L T
TATTCTACAGTGGCTGGAGATGTTATTGCAAGATAT------------------------CGTTATTTGACT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T D E H G Q K I Q E K A Q K A G K T E I E Y L
G T D E H G - - - - - - - - - - - - - - - - - -
GGAACGGATGAACACGGT------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D E M I A G I K Q L W A K L E I S N D D F I R T
D E M I A G I K Q L W A K L . . . . D D F I R T
GATGAGATGATTGCTGGAATTAAACAATTGTGGGCTAAGCTT------------GATGATTTTATCAGAACA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T E E R H K H V V E Q V F E R L L K Q G D I Y L
T E - - - - - - - - - - - - - - - - - - - - - -
ACTGAA------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G E Y E G W Y S V P D E T Y Y T E S Q L V D P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y E N G K I I G G K S P D S G H E V E L V K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S Y F F N I S K Y T D R L L E F Y D Q N P D F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q P P S R K N E M I N N F I K P G L A D L A V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R T S F N W G V H V P S N P K H V V Y V W I D A
- - - - - - - - - - - - - - - - - - Y V W I D A
------------------------------------------------------TATGTTTGGATTGATGCG
241242243244245246247248249250251252253254255256257258259260261262263264
L V N Y I S A L G Y L S D D E S L F N K Y W P A
L V N Y I - - - - - - - - - - - - - - - - - - -
TTAGTTAACTATATT---------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D I H L M A K E I V R F H S I I W P I L L M A L
- I H L M A K E I V R F . S I I W P I L L M A L
---ATTCATTTAATGGCTAAGGAAATTGTGCGATTC---TCAATTATTTGGCCTATTTTATTGATGGCATTA
289290291292293294295296297298299300301302303304305306307308309310311312
D L P L P K K V F A H G W I L M K D G K M S K S
- - - - P K . V F A H - - - - - - - - K M S K S
------------CCTAAA---GTCTTTGCACAT------------------------AAAATGAGTAAATCT
313314315316317318319320321322323324325326327328329330331332333334335336
K G N V V D P N I L I D R Y G L D A T R Y Y L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R E L P F G S D G V F T P E A F V E R T N F D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A N D L G N L V N R T I S M I N K Y F D G E L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A Y Q G P L H E L D E E M E A M A L E T V K S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T E S M E S L Q F S V A L S T V W K F I S R T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K Y I D E T T P W V L A K D D S Q K D M L G N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M A H L V E N I R Y A A V L L R P F L T H A P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E I F E Q L N I N N P Q F M E F S S L E Q Y G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L T E P I M V T G Q P K P I F P R L D S E A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A Y I K E S M Q P P A T E E E K E E I P S K P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I D I K D F D K V E I K A A T I I D A E H V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S D K L L K I Q V D L D S E Q R Q I V S G I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
F Y T P D D I I G K K V A V V T N L K P A K L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G Q K S E G M I L S A E K D G V L T L V S L P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657
A I P N G A V I K
- - - - - - - - -
---------------------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_met_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K F Y I T T P I Y Y V N S E P H I G S A Y T T
- - - Y I T T . I Y Y V N S E P H I G S A Y T T
---------CTTCGCACCTGG---GATTTCTCCATCTACAGTCAAAAGTCTCAAGGTATCGCCGGACTTTGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I V A D I I A R Y K R F M G Y D V F F L T G T D
I V A D I I A R Y - - - - - - - - F F L T G T D
GGCGAGAAGCATTCCCTGAGACTCTAT------------------------ATTAGCGACAACGACGATCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E H G Q K V L Q A A Q Q A G K D P Q E F C D E L
E H G - - - - - - - - - - - - - - - - - - D E L
TTTTCCTAC------------------------------------------------------CGTTCCAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E K F K R L W K E L K I T N D Y F I R T T D E
A E K F K R L W K E L . . . . D Y F I R T T D -
ATCGATTATCAATCTGAGAAGTTTTCTGGAATT------------CGCTTCGAGGACCTTTGCGATTCT---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M H M K T V Q E F V A K M K E N G D V Y K G I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K G W Y C V P C E T F W N E D E V I K E G E E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F C P E C K R P V K W V E E E N Y F F R L S K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R D S L L K Y Y E E H P D F V E P D F R R N E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L K I L E G G L K D L S I T R T T F K W G V P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K D D P E H V I Y V W V D A L I N Y I S A I G Y
- - - - - - - - Y V W V D A L I N Y I - - - - -
------------------------TGTGAGCCGGTAGGAATCCATGAGTTCATGGTA---------------
241242243244245246247248249250251252253254255256257258259260261262263264
G W N D E M F N K W W P A D L H L I G K E I N R
- - - - - - - - - - - - - - L H L I G K E I N R
------------------------------------------GGAAGGAGAAGGGAGTCTTCCGTTGAAATA
265266267268269270271272273274275276277278279280281282283284285286287288
F H S I I W P A M L M S V G L P L P K K V F A H
F . S I I W P A M L M S V - - - - P K . V F A H
CTT---TATCATAGCCGTGATCCTGTGAAGGAGATTTCC------------GAGATC---ATTCAATCTGTG
289290291292293294295296297298299300301302303304305306307308309310311312
G W L T V N G Q K I S K S L G N A I D P R F F V
- - - - - - - - K I S K S - - - - - - - - - - -
------------------------GCCGTCTTTTCCGAA---------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K R Y G N D V V R Y Y L I R D I M F G K D G D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E E R L V H R L N S D L A N D Y G N L L H R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T A M I K K Y F N G R L P S P S A Q E G F D S W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L K E R F F E T K D A Y H E L M D S Y R L T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L D K I W E F I A D V N K Y F N D T K P W I L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K E G N M E R L G T V L Y N S L E A V F K V A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M T L P V M P D T S E E V F R R V S F E E K P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K E H L E N W G V L K P G S T V I H G E P L F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K I D A K D F K K V V E T V S A E Q N A I T I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D F S K V D L R I A K V L E A E K V P N S R K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L R L I I D L G T E K R Q I V A G I A E H Y R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E E L V G K L I V V V A N L K P A K L M G I E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q G M L L A A K S G D T L R L L T V D G E I T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629
G A K V S
- - - - -
---------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_met_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K M N L V T A A L P Y V N N I P H L G N L V
- - - - - L V T A . L P Y V N N I P H L G N L V
---------------GTTTGGAATATC---AGATAAAATTTTGTTCTTAGAATTTTCTAATATTAAATTTAT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q V L S A D A F A R Y S K M S G I E T L Y V C G
Q V L S A D A F A R Y - - - - - - - - L Y V C G
TCCGTTTATTTTAAGCTCTCCGTTTTCTGCTAC------------------------TATGTCAATTTTAGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T D E Y G T A T E T K A L I E N T T P L E L C N
T D E Y G - - - - - - - - - - - - - - - - - - N
TGGGCAGGCAAGATC------------------------------------------------------TGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K Y Y E I H K S I Y K W F N I E F D I F G R T T
K Y Y E I H K S I Y K W F . . . . D I F G R T T
ATCTTCTACAATTATAACTTTAAAATTTTTATTTTTGTC------------TAGCATTCCTTCAGATTTTAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N K N H Q D I V Q N F F L Q L E K N G Y I K E R
N - - - - - - - - - - - - - - - - - - - - - - -
TCC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E T E Q F Y C N K D S M F L A D R Y V I G E C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E C Q S M A K G D Q C D N C S K L L N P T D L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N P K C I I C K N K P I L K K T N H L Y L D L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I K T K L E K W I K N P D T S K N W N T N A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K M T K A F L R D G L K E R A I T R D L K W G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P V P K K G F E N K V F Y V W F D A P I G Y I S
- - - - - - - - - - - - Y V W F D A P I G Y I -
------------------------------------TAAGTCTCTGATTAGGTATATTAAGTTTGAGAT---
265266267268269270271272273274275276277278279280281282283284285286287288
I T K N I I K N W E S W W K N N D Q V N L V Q F
- - - - - - - - - - - - - - - - - - - - - V Q F
---------------------------------------------------------------ATTTCCAAG
289290291292293294295296297298299300301302303304305306307308309310311312
I G K D N I L F H T I I F P C I E I G S E E N W
I G K D N I L F . T I I F P C I E I G S - - - -
GGAAGAAATTTTAAGTATTTCTTT---AGCAGATTTTAGTTCTGTCTTTTTAAAAAGATT------------
313314315316317318319320321322323324325326327328329330331332333334335336
T I L N Q L S S S E Y L N Y E N L K F S K S E G
- - L . Q L S S S - - - - - - - - K F S K S - -
------TGG---TATTTGTTTCCAAAA------------------------TATTACATCTCCAAA------
337338339340341342343344345346347348349350351352353354355356357358359360
T G I F G N D A I T T G I P S D I W R F Y I Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N R P E K S D F Q F M W Q D L M E R V N T E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D N F S N L V N R V L T F Q R K F F G D V I E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I E I Q N K F W K Q I T P K Y N K I L N L F K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T E L K S A L K E I L K I S S L G N K I F Q D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E P W K R K N N S P Q E T K E L I S N L I Y L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R D L S I L M M P F I P E T S K K I Q Q F F G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S Y Q F S T K I L G T K S G I K K I E F T E I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F N K L E Q K K I N N L K L K Y S G D K N M K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N E Q A E N L P I A K E Q P E N L F R E K V L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R V V K I N K I E R N P E A K N L F I L K L D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G T N K D K Q I V S G L E G Y Y T E E E L L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
H I I I V D N L K P A K F R G I K S E G M L I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A E D K N K N F K V I I V E D S I Q N P I A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R I I L E N D Q N K D L A C P P K I D I N K F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K A N I V A E N G E L K I N G I N L I L E N S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734
N K I L S K D I P N G T V C
- - - - - - - - - - - - - -
------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_met_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K N F K R T T V T S A L P Y A N G P V H I G
- - - - - - - - T V T S . L P Y A N G P V H I G
------------------------ACCGTCACATCG---CTGCCGTATGCGAACGGCCCCGTCCATATCGGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H L A G V Y V P A D I Y V R Y L R L K K E D V L
H L A . V Y V P A D I Y V R Y - - - - - - - - L
CATTTGGCC---GTATATGTACCGGCAGACATCTATGTCCGCTAT------------------------CTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F I G G S D E H G V P I T I R A K K E G I T P Q
F I G G S D E H G - - - - - - - - - - - - - - -
TTCATCGGAGGCTCCGACGAACATGGG---------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D V V D R Y H F L I K K S F E E F G I S F D V Y
- - - D R Y H F L I K K S F E E F . . . . D V Y
---------GACCGCTATCACTTCCTGATTAAGAAATCATTCGAAGAATTC------------GACGTATAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S R T S S K T H H E L A S D F F K K L Y E K G E
S R T S S - - - - - - - - - - - - - - - - - - -
AGCCGTACATCGTCC---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F I E K T S E Q Y Y D E E A H Q F L A D R Y I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G E C P H C H S E G A Y G D Q C E K C G T S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P T D L I N P K S A I S G S K P V M K E T K H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y L P L D K H E T W L R Q W I L E E H K E W R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N V Y G Q C K S W L D M G L Q P R A V S R D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W G I P V P V E G A E G K V L Y V W F D A P I G
- - - - - - - - - - - - - - - Y V W F D A P I G
---------------------------------------------TACGTATGGTTCGATGCACCAATCGGT
265266267268269270271272273274275276277278279280281282283284285286287288
Y I S N T K E L L P D S W E T W W K D P E T R L
Y I - - - - - - - - - - - - - - - - - - - - - -
TACATA------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V H F I G K D N I V F H C I V F P A M L K A E G
V H F I G K D N I V F . C I V F P A M L K A E -
GTTCACTTTATCGGAAAAGATAATATCGTATTT---TGCATCGTATTTCCGGCTATGCTGAAAGCTGAA---
313314315316317318319320321322323324325326327328329330331332333334335336
S Y I L P D N V P S N E F L N L E G D K I S T S
- - - - P . N V P S N - - - - - - - - K I S T S
------------CCG---AATGTACCGAGCAAC------------------------AAAATATCCACTTCA
337338339340341342343344345346347348349350351352353354355356357358359360
R N W A V W L H E Y L E D F P G K Q D V L R Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L T A N A P E T K D N D F T W K D F Q A R N N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L V A V Y G N F V N R A M V L T Q K Y F E G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V P A A G E L I D Y D K E T L K E F S D V K A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V E K L L N V F K F R D A Q K E A M N L A R I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N K Y L A D T E P W K L A K T D M E R V G T I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N I S L Q L V A N L A I A F E P F L P F S S E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L R Q M L N M D S F D W A E L G R N D L L P A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
H Q L N K P E L L F E K I E D A T I E A Q V Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L L D T K K A N E E A N Y K A K P I R A N I E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D D F M K L D I R V G T V L E C Q K V P K A D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L L Q F K I D D G L E T R T I V S G I A Q H Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P E E L V G K Q V C F I A N L A P R K L K G I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S E G M I L S A E N N D G S L A V V M P G R E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679
K P G S E V K
- - - - - - -
---------------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_met_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P Q E K N T F Y I T T P I Y Y P S G K L H I G
- - - - - - - - Y I T T . I Y Y P S G K L H I G
------------------------TACATCACTACA---ATTTATTACCCAAGTGGGAAGCTACATATTGGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H A Y T T V A G D A M A R Y K R L R G F D V R Y
H A Y T T V A G D A M A R Y - - - - - - - - R Y
CATGCCTACACGACCGTTGCAGGTGATGCGATGGCTCGTTAT------------------------AGATAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L T G T D E H G Q K I Q Q T A E K E N I T P Q E
L T G T D E H G - - - - - - - - - - - - - - - -
TTAACTGGTACAGATGAGCACGGA------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V D R A A E D I Q Q L W K K L D I S N D D F I
- - D R A A E D I Q Q L W K K L D - - - - D F I
------GATCGTGCGGCAGAAGACATTCAGCAGCTTTGGAAAAAGCTCGAC------------GACTTCATT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R T T E E R H K N V I E K V F Q K L L D N G D I
R T T E - - - - - - - - - - - - - - - - - - - -
CGGACGACAGAG------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y L D E Y E G W Y S I P D E T F Y T E T Q L V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V E R N E K G E V I G G K S P D S G H P V E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K E E S Y F F R M G K Y A D R L L A F Y E E N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E F I Q P E S R K N E M I N N F I K P G L E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A V S R T T F D W G I K V P G N P K H V I Y V W
- - - - - - - - - - - - - - - - - - - - - Y V W
---------------------------------------------------------------TATGTTTGG
241242243244245246247248249250251252253254255256257258259260261262263264
I D A L F N Y I T A L G F N T A N D E N Y Q K Y
I D A L F N Y I - - - - - - - - - - - - - - - -
ATAGATGCGCTGTTTAATTACATT------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W P A D V H L V G K E I V R F H T I Y W P I M L
- - - - V H L V G K E I V R F . T I Y W P I M L
------------GTTCATCTTGTCGGTAAGGAGATCGTCCGCTTC---ACCATTTACTGGCCGATTATGCTG
289290291292293294295296297298299300301302303304305306307308309310311312
M A L D L P L P K K V F A H G W L L M K D G K M
M A L - - - - P K . V F A H - - - - - - - - K M
ATGGCATTG------------CCGAAA---GTTTTTGCCCAC------------------------AAAATG
313314315316317318319320321322323324325326327328329330331332333334335336
S K S K G N V V D P V T L I D K Y G L D A L R Y
S K S - - - - - - - - - - - - - - - - - - - - -
TCTAAATCA---------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y L L R E V P F G S D G V F T P E G F V E R I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y D L A N D L G N L L N R T V A M V N K Y F D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R V Q S Y E G P V T A F D E Q L S S F S Q K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E A Y E Q A I E N M E F S V A L S S L W Q F V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R T N K Y I D E T A P W V L A K D K D K E K D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q S V M Y H L A E S L R I T A V L L Q P F L T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T P E K I F A Q L G V T D A S L K T W D S I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F G Q L K S V K V Q K G E P L F P R L E A E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V A Y I K S K M Q G T A P K E E P K Q E E K A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E R L P E I T I D D F M S T E L R V A E V I H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E P V K K A D R L L K L Q L D L G F E K R Q V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S G I A K H Y K P E E L V G R K V I C V T N L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P V K L R G E L S Q G M I L A G E D N G V L S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662
A A V D S S L S N G T R I K
- - - - - - - - - - - - - -
------------------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_met_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T S A R S A A A V R E T A A P R G E C G R T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A R T S A A G R P A R I A A S L R F S A S S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F R D P M S A S D L H P V Q A G A P Q G R R Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V T S A L P Y A N G Q I H I G H L V E Y I Q T
L V T S . L P Y A N G Q I H I G H L V E Y I Q T
GGTCTTCTCCTC---GACGTCGAGCGTGAGCTGCAGCAGTTTGTCCGAGCCTTCGACCGCCTGGCACGCGAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D I W A R T M R M H G H E I Y Y I G A D D T H G
D I W A R T - - - - - - - - Y Y I G A D D T H G
GATCTTCGCGATGCGCAG------------------------CGAGATGAACGGCGATGCTTCGTCGTCGGC
121122123124125126127128129130131132133134135136137138139140141142143144
T P V M L R A E Q E G V S P K Q L I E R V W R E
- - - - - - - - - - - - - - - - - - E R V W R E
------------------------------------------------------CGTCGCGCCGGCCGCGTC
145146147148149150151152153154155156157158159160161162163164165166167168
H K R D F D S F G V S F D N F Y T T D S D E N R
H K R D F D S F . . . . D N F Y T T D S - - - -
GGCCGCCGCGGCGCCTTGCAGCGA------------CGCGAGGAGCGCGTCGATCTGCTT------------
169170171172173174175176177178179180181182183184185186187188189190191192
V L S E K I Y L A L K E A G F I A E R E I E Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y D P V K Q M F L P D R F I K G E C P K C H A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D Q Y G D S C E V C G T T Y Q P T D L V N P Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V S G A T P V R K T S T H H F F R L S D P R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E A F L R E W V S G L A Q P E A T N K M R E W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G D A G E A K L A D W D I S R D A P Y F G F E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P G A P G K Y F Y V W L D A P V G Y Y A S F K N
- - - - - - - - Y V W L D A P V G Y Y - - - - -
------------------------ATTGACGCGCGCCTGGAAGTCCTCGAGGTTCAG---------------
337338339340341342343344345346347348349350351352353354355356357358359360
L C E R R G L D F D A W I S K D S T T E Q Y H F
- - - - - - - - - - - - - - - - - - - - - Y H F
---------------------------------------------------------------GTAGCTCTG
361362363364365366367368369370371372373374375376377378379380381382383384
I G K D I L Y F H T L F W P A M L E F S G H R T
I G K D I L Y F . T L F W P A M L E F S - - - -
CGCGGTGATGAACGTGCCGCGCGA---CGACATCTTCGCGCCGTCGACCGTCAGGAAGCC------------
385386387388389390391392393394395396397398399400401402403404405406407408
P T N V F A H G F L T V D G A K M S K S R G T F
P . N V F A H - - - - - - - - K M S K S - - - -
GTT---CGGCGTGCGGTGGCC------------------------GAACAGCGTGTGGAA------------
409410411412413414415416417418419420421422423424425426427428429430431432
I T A Q S Y I D A G L N P E W L R Y Y F A A K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N A T M E D I D L N L E D F Q A R V N S D L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K Y V N I A S R A A G F L I K R F D G R V Q A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A T N H P L L V T L R D A I P Q I A A H Y E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E Y G R A L R Q T M E L A D A V N G Y V D T A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P W E L A K D P A N A V A L H E T C T V S L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F R L L S L A L K P V L P R V A E G V E A F L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I A P L T W A D A N K P L S S E Q P I R A Y Q H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L M T R V D P K Q I D A L L A A N R S S L Q G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A A A D A A G A T N G N G A K A A K S A K A A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A A S A D D E A S P F I S I D D F A K I D L R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A K I V A C Q A V E G S D K L L Q L T L D V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E K T R N V F S G I K S A Y Q P E Q L V G K L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V M V A N L A P R K M K F G L S E G M V L A A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A A D E K A E P G L Y I L E P H S G A K P G M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770
V K
- -
------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_met_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q N P P Q H P E A Q S P E T R D R E F F I T A
- - - - - - - - - - - - - - - - - - - - F I T A
------------------------------------------------------------TTCATCACCGCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I D Y A N G T P H I G H V Y E K I L A D A I A
. I D Y A N G T P H I G H V Y E K I L A D A I A
---ATCGACTATGCCAACGGCACCCCGCACATCGGGCACGTCTACGAAAAGATTCTGGCCGACGCGATTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R Y Q R L A G R D V T F V M G T D E H G E K I S
R Y - - - - - - - - T F V M G T D E H G - - - -
CGTTAC------------------------ACGTTTGTGATGGGCACCGACGAGCACGGC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K A A A K G G V T P Q E L V D D L S E R A F Q G
- - - - - - - - - - - - - - D D L S E . A F Q G
------------------------------------------GACGACCTCTCGGAG---GCCTTTCAGGGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L W K K L G I S Y D F F I R T T S A K H K K Y V
L W K K L . . . . D F F I R T T S - - - - - - -
CTGTGGAAAAAGCTC------------GACTTTTTTATCCGCACCACCTCG---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q D V L Q R V Y D A G D I Y F A E Y E G L Y S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G A E R Y V T E K E L V E G P D G V R R F P G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K D P P E L R R E A N Y F F N M Q K Y Q P W L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E T L Q Q N P D L I Q P A G Y R N E V L E M L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E D I G P L S I S R P K A R V P W G I E L P W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T D H V T Y V W F D A L L S Y L T P L V S Q G Q
- - - - - Y V W F D A L L S Y L - - - - - - - -
---------------TACGTGTGGTTCGATGCGCTGCTGAGCTACCTG------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D A S M S G K A W H V I G K D I L K P H A V F W
- - - - - - - - W H V I G K D I L K P . A V F W
------------------------TGGCACGTCATCGGCAAGGACATCCTCAAGCCG---GCGGTGTTCTGG
289290291292293294295296297298299300301302303304305306307308309310311312
P T M L R A A G L P L Y R R L V V H S H I L A E
P T M L R A A - - - - Y R . L V V H - - - - - -
CCGACCATGCTGCGCGCCGCC------------TACCGC---TTGGTGGTGCAC------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D G R K M G K S L G N A I D P E E L V A A W P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D A I R Y A L L R E A S L G A D S P F G E G V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V S R L N S D L A N D L G N L L S R T V S M I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Y R G G V I P A A T E P T D R E R E I E A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R A L P D E V L R L V D E L K I N M A I D A A M
- - - - - - - - - - - - - - K . . . . . . . . M
------------------------------------------AAA------------------------ATG
433434435436437438439440441442443444445446447448449450451452453454455456
S F V R D L N R Y I A E S T P W T L A K S P E T
S . . . . . . . . . . . . . . . . . . K S - - -
AGC------------------------------------------------------AAGTCG---------
457458459460461462463464465466467468469470471472473474475476477478479480
Q G R L D T V L Y T A A E G L R V A S V A L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V I P T K A K E L R E Q L G L G R Q G Y P L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A W G L T P A G T R V Q G G A I L F P K P E P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A D E T K N A E A K P P K P Q A K K E K K T V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D T A P A K T T E Q K P E A A A P A Q N D G L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S I D D F A K I D L R I A E V V A C E A V E K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D K L L K L T V K L G D E T R T V V S G I R K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y E P E A L V G R K V V L V A N L K P A K L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I E S Q G M I L A A E D D A G N L D L V G T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681
D L P S G T K V R
- - - - - - - - -
---------------------------
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_met_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K K T F Y L T T P I Y Y P S D K L H I G H A
- - - - - - Y L T T . I Y Y P S D K L H I G H A
------------------TATTTGACGACG---ATTTATTACCCAAGCGACAAATTGCACATTGGCCATGCT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y T T V A G D A M A R Y K R L R G Y D V M Y L T
Y T T V A G D A M A R Y - - - - - - - - M Y L T
TATACGACCGTGGCGGGGGATGCGATGGCTCGCTAT------------------------ATGTATTTGACC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T D E H G Q K I Q R K A Q E K G V T P Q Q Y V
G T D E H G - - - - - - - - - - - - - - - - - -
GGAACGGACGAACATGGG------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D D I V A G I Q E L W R K L D I S Y D D F I R T
D D I V A G I Q E L W R K L D - - - - D F I R T
GACGACATTGTCGCCGGCATCCAAGAGTTGTGGAGAAAACTGGAC------------GATTTTATCCGGACG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T Q E R H K K I V E K I F A R L V E Q G D I Y L
T Q - - - - - - - - - - - - - - - - - - - - - -
ACACAG------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G E Y E G W Y C T P C E S F Y T E R Q L V D G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C P D C G R P V E K V K E E S Y F F R M S K Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D R L L Q Y Y E E N P D F I Q P E S R K N E M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N N F I K P G L E D L A V S R T T F D W G I K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P G D P K H V I Y V W I D A L A N Y I T A L G Y
- - - - - - - - Y V W I D A L A N Y I - - - - -
------------------------TACGTCTGGATCGATGCGCTGGCCAACTACATC---------------
241242243244245246247248249250251252253254255256257258259260261262263264
G T D N D E K F R K Y W P A D V H L V G K E I V
- - - - - - - - - - - - - - - V H L V G K E I V
---------------------------------------------GTCCATCTCGTCGGCAAGGAGATCGTC
265266267268269270271272273274275276277278279280281282283284285286287288
R F H T I Y W P I M L M A L G L P L P K K V F G
R F . T I Y W P I M L M A L - - - - P K . V F G
CGCTTC---ACGATTTACTGGCCGATCATGCTGATGGCGCTC------------CCGAAA---GTGTTCGGA
289290291292293294295296297298299300301302303304305306307308309310311312
H G W L L M K D G K M S K S K G N V V D P V M I
H - - - - - - - - K M S K S - - - - - - - - - -
CAT------------------------AAAATGTCGAAATCG------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I D R Y G L D A L R Y Y L L R E V P F G S D G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F T P E G F I E R I N Y D L A N D L G N L L H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T V A M I E K Y F G G A I P P Y R G P K T P F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R D L S E T A R E V V R Q Y E E A M E R M E F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V A L S A V W Q L I G R T N K Y I D E T Q P W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L A K E E S K R E E L A S V M A H L A E S L R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T A V L L Q P F L T R T P E R I F T Q L G I S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R S L K E W D S L Y D F G L I P E G T N V Q K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E P L F P R L D I G V E V E Y I K A H M Q G G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P A E A A K E E K Q A A R A E E I S I D D F A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V D L R V A E V V H A E R M K N A D K L L K L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L D L G G E K R Q V I S G I A E F Y K P E E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G K K V I C V A N L K P A K L R G E W S E G M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L A G G S G D G F S L A T V D Q H V P N G T K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649
K
-
---
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_met_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K E Q T V T D K P R W F Q T T A I D Y P N S R
- - - - - - - - - - - - F Q T T . I D Y P N S R
------------------------------------TGCAACCAACTC---CGTGATGCGCAGGTCGTCGGG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P H I G T A F E K L G A D V Q A R Y R R M E G F
P H I G T A F E K L G A D V Q A R Y - - - - - -
TTGGGCCTTCAGTGCGATCGCGTCCGCGTACTTCACTTCGGCCCACGGGGTCGG------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V F F L M G N D E N T V K V S K R A A E L G Q
- - F F L M G N D E N T - - - - - - - - - - - -
------CTCCGCGCTCTTGGGGATGAACGGCTTCAG------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D T Q V Y C D D M A R Q F R E V W A A L D I S Y
- - - - - - D D M A R Q F R E V W A A L D - - -
------------------CGCGTCCTTGTCCGTCTTCACGAGTTTCCACGGAGCGTTCGCTTC---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D T F V Q T S S E R H K Q C C R K F I Q K V Y D
- T F V Q T S S - - - - - - - - - - - - - - - -
---CGTCGGCGTGAGGAAGTCCTG------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N G H I Y K G S Y E G W Y C D G C E E F K S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V R D E N A G N C P V H K R P L T R R S E P C Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L F R L S A F Q D R L L A H Y K E N P D F I Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S R R N E M I S L I E T E G L R D I N I S R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E D W G I R I P F D P E F T I Y V W F D A L L
- - - - - - - - - - - - - - - - Y V W F D A L L
------------------------------------------------GAAGTTCACGAACCCGTGGCTGAA
241242243244245246247248249250251252253254255256257258259260261262263264
T Y I T G I G Y G D D E A T F R K H W P C D T H
T Y I - - - - - - - - - - - - - - - - - - - T H
CACCTTCTT---------------------------------------------------------GGTGAT
265266267268269270271272273274275276277278279280281282283284285286287288
F I G K D I T R F H C A L W P A M L W A A G E E
F I G K D I T R F . C A L W P A M L W A A - - -
GTCCTTACCGATAAAGTGCGTGTCGCA---CCAGTGTTTGCGGAACGTCGCTTCGTCGTCGCC---------
289290291292293294295296297298299300301302303304305306307308309310311312
A P K K V F S H G F V N F E G K I G K S R E E E
- P K . V F S H - - - - - - - K I G K S - - - -
---GGTGAT---CGTGAGCAGCGC---------------------GAACTCCGGGTCGAA------------
313314315316317318319320321322323324325326327328329330331332333334335336
L R A R G L D Y L L E P M L I I Q R F S A E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R Y Y F M R E C P Y P S D G E I S P E R F M E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y N S E L A N N L G N L F S R E M T I T W K N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G G V F D G T A G Q V P D P V V P G L N L E L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V G E V R E H I E A C R Y H L A L Q K I V Q D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L T P T N Q Y L E A N A P W K L V K T D K D A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K K V L F N A V Q S L R V A S I L L K P F I P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S A E T I Y T S F N F P T P W A E V K Y A D A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A L K A Q P D D L R I T A E L V A D K V K P L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532
P R I G
- - - -
------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_met_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N F A D R S K D T F A V T T P L Y Y V N D L P
- - - - - - - - - - - A V T T . L Y Y V N D L P
---------------------------------CACTGGTCTAGG---CCCCAATTGTTGTATATCGCTCAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
H I G S A Y P T M A A D A L A R F E R L L G K S
H I G S A Y P T M A A D A L A R F - - - - - - -
TATCCCCCAATTTGAGTGACTACTGAATGGAGTGGTAATGAAAGTTTGAGC---------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L M I T G T D E H G Q K I Q R A A E S H G R S
- L M I T G T D E H G - - - - - - - - - - - - -
---TCCTAATTGCTGATAAATTTCGGTGCAAGT---------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P Q E Y C D R I S S S F V S L W E L L N I Q Y D
- - - - - D R I S S S F V S L W E L L . . . . D
---------------AGCATACAATACTTCCTCCACTTCTGTCTGTCGCTTTTGTTT------------CGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R F S R T T A T Q H E A I V K E F F G R V W D A
R F S R T T A - - - - - - - - - - - - - - - - -
GGCTTTCTCATCAATGAATTT---------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G D I Y S D R Q Q G W Y C V S C E E F K E E R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L E G N Y C P L H P N K Q V E W R D E Q N Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F R L S R Y Q E Q L E A H Y Q K Y P D F I Q P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S R R N E V L N F V S Q G L Q D F S I S R V N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D W G F P V P V A P E Q T L Y V W F D A L L G Y
- - - - - - - - - - - - - - Y V W F D A L L G Y
------------------------------------------GGTTAAAAAGCCGTGTCCGAAAACTCGCCC
241242243244245246247248249250251252253254255256257258259260261262263264
V T A L L D P D S E A T L E N A L A Q W W P I N
V - - - - - - - - - - - - - - - - - - - - - - -
TGG---------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I H I I G K D I L R F H A V Y W P A M L M S A G
I H I I G K D I L R F . A V Y W P A M L M S A -
GATAATGTGTATGTTAATGGGCCACCATTGAGC---AGCATTTTCCAAAGTTGCTTCGCTGTCAGGATC---
289290291292293294295296297298299300301302303304305306307308309310311312
L P L P G R V F G H G F L T K D G Q K M G K T M
- - - P . R V F G H - - - - - - - - K M G K T -
---------CAC---TCCTAACAATGCATC------------------------TGGCGCGACGGGAAC---
313314315316317318319320321322323324325326327328329330331332333334335336
G N T I D P V A L V K Q Y G S D A V R Y Y F L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T I E F G K D G D F S E T R F I N T V N A D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D N L G N L L N R T L S M V R K Y C A G K V P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V G E V A A E H P L K A I A T S L G Q E V K Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y E V L A F D R A C E A I L D L V R A S N K F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D E K A P W S L Y K Q K R Q T E V E E V L Y A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L E S V R L A A Y L L A P I I P H T C T E I Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q L G F A I D F N H K A Q T F I T T P F S S H S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N W G I L S D I Q Q L G E P R P V F Q R I E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531
Q K V
- - -
---------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_met_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Q Q A N P N R Y T I T A A L P Y A N G P I H
- - - - - - - - - - T I T A . L P Y A N G P I H
------------------------------ATTTTCAATACG---AAAAAGCAAAGTTGGAGCTGGCAATAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I G H L A G V Y I P A D I Y A R Y L R S K K K E
I G H L A . V Y I P A D I Y A R Y - - - - - - -
AGTTCCTGGCTTAAT---CTCCATACTACCTGCATTGTCCCAATCTAGATT---------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V I F I S G S D E H G V P I T I R A Q Q E G I T
- I F I S G S D E H G - - - - - - - - - - - - -
---CTTCTGGCTGGTAAAAGGCAAAAAGGGTGC---------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P Q Q I V D K Y H H L N K Q N L Q D L G I S F D
- - - - - D K Y H H L N K Q N L Q D L . . . . D
---------------CACCTGTTCTGGCATGGTTTTGATTAAATGCCAAGGTGCTGT------------CTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I F S R T S S E V H H Q T A S D F F T T L Y N K
I F S R T S S - - - - - - - - - - - - - - - - -
ATTGCCTGCTCTAGCTAGATC---------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G I L I A K E T E Q Y Y D P A S H Q F L A D R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I R G T C P K C G Y T D A Y G D Q C E V C G T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L S P E E L I D P R S A L S G E T P I L K A T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
H W Y L P L D K Y E N W L K H W I L E T H T D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K S N V Y G Q C K S W L E Q G L Q P R A V T R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L D W G V P V P L P E A Y H K V L Y V W F D A P
- - - - - - - - - - - - - - - - - Y V W F D A P
---------------------------------------------------ATTATCTTTACCCACAAAATG
265266267268269270271272273274275276277278279280281282283284285286287288
I G Y I S A T K E W A I E N N Q N W E P F W K D
I G Y I - - - - - - - - - - - - - - - - - - - -
CACTAGCTTGGT------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S T T K L V H F V G K D N I V F H C I I F P V M
- - - - - V H F V G K D N I V F . C I I F P V M
---------------GATAGGTGCATCAAACCACACATATAGCACTTT---GTAAGCTTCTGGTAACGGCAC
313314315316317318319320321322323324325326327328329330331332333334335336
L Q A H E G Y I L P E Q V P A N E F M N L A G G
L Q A H - - - - - P . Q V P A N - - - - - - - -
AGGAACTCCCCA---------------TAC---ACGAGGCTGTAAACC------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K I S T S R N H A V W L H E Y L E N F K G Q Q D
K I S T S - - - - - - - - - - - - - - - - - - -
TCCATATACATTAGA---------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V L R Y V L C V N A P E A K D S D F T W Q D F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A K N N N E L V A T L G N F V N R T L V L I Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y Y A G I V P E M T S L I H T D Q A I I I Q M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E A A D S I G Q S I E K Y R F K E A I Q K W M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L A R A G N K Y L A D T A P W H L I K T M P E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V Q T I L N I S L Q L T A H I A I L G A P F L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F T S Q K L S Q M L L L D N L D W D N A G S M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I I K P G T L L P A P T L L F E R I E N E K I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557
Q E Q S H
- - - - -
---------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_met_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
K R S F R V Y S D Y C R N N L T Y N K M T K I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T T Y R N S S G K Y Y Y F T T A I N Y T N G T P
- - - - - - - - - - - Y F T T . I N Y T N G T P
---------------------------------TACTTCACGACT---ATAAACTATACTAATGGAACACCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H M G H A Y E I V T S D I L V R I A R L F G F N
H M G H A Y E I V T S D I L V R I - - - - - - -
CATATGGGGCACGCATATGAAATAGTAACTTCTGATATTCTTGTTAGAATT---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T R F Q T G T D E H G Q K I A A T A E K K G I S
- R F Q T G T D E H G - - - - - - - - - - - - -
---AGATTTCAAACAGGAACTGATGAACATGGG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P K E L C D E N V K Q F K N M N E K L Q I S T D
- - - - - D E N V K Q F K N M N E K L . . . . D
---------------GATGAAAATGTAAAACAATTTAAAAATATGAATGAAAAACTT------------GAC
121122123124125126127128129130131132133134135136137138139140141142143144
R F I R T T D A D H Y E S C K E L W R R C E A K
R F I R T T D - - - - - - - - - - - - - - - - -
AGGTTTATTAGAACAACTGAT---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G D I Y L G K Y N G W Y N V R E E S F M T E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K M L N Y T D P I S G L P L T K M E E P S Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F R I T N Y L E S I K N H I I D N P E F I Q P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S S R E S I L A R L E A L G S D S E D L S I S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A S F S W G V P V P N D Q E H V M Y V W F D A L
- - - - - - - - - - - - - - - - - Y V W F D A L
---------------------------------------------------TATGTTTGGTTTGATGCTCTA
265266267268269270271272273274275276277278279280281282283284285286287288
T N Y I T G L K W A D F D N D L E E N S L F N K
T N Y I - - - - - - - - - - - - - - - - - - - -
ACAAATTATATT------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y W E N T V H I V G K D I T W F H S V I W P A M
- - - - - V H I V G K D I T W F . S V I W P A M
---------------GTTCATATCGTTGGTAAAGACATTACTTGGTTC---TCCGTAATCTGGCCTGCGATG
313314315316317318319320321322323324325326327328329330331332333334335336
L L S V G L S L P K T I F A H G F V T A P D G K
L L S V - - - - P . T I F A H - - - - - - - - -
CTATTAAGTGTC------------CCA---ACGATTTTTGCTCAT---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K M S K S L G N V V D P F E Q I D K I G S D P F
K M S K S - - - - - - - - - - - - - - - - - - -
AAAATGAGTAAGAGC---------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R Y Y L A R E G R F G N D I K Y Q P S S V I D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N N G E L A D T Y G N L I S R I T N L T H K F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q G V A P S L S Q S L L L D K P V D I D T V F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E Y Y L A W N C F R I D E C I Q I A M D L S R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I N K F L T D H A P W N K D N G K S D E E R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I I R I V L E G S Y Y I S I L L S P F I T L A C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K E V F N R L G T P E K I I P E V D I N Y N N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K P G T P I L I G E P L F K R I V N K E E K T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E E L K A E K R E R E K Q R R S G N K K L S E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581
K D K G K
- - - - -
---------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_met_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A L H T S R E A L L A A Y P L H A S R K I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W S S W N L L R L R T Q G T R V N A E P H M G S
- - - - - - - R L R T . G T R V N A E P H M G S
---------------------AGGCTGAGAACA---GGAACGCGGGTGAATGCAGAGCCGCACATGGGCAGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A Y T T M A A D A I T R F Q R L R G K R V S F V
A Y T T M A A D A I T R F - - - - - - - - S F V
GCTTACACCACCATGGCAGCAGATGCCATTACCAGGTTT------------------------AGCTTTGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G T D E H G E K I A E A A A K K G Q E P Q Q H
T G T D E H G - - - - - - - - - - - - - - - - -
ACCGGGACGGATGAACATGGA---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C D G V V A S F K G L W E E M D I Q Y D S F I R
- D G V V A S F K G L W E E M D - - - - S F I R
---GATGGAGTCGTGGCATCTTTCAAGGGCCTGTGGGAGGAGATGGAC------------AGCTTCATTCGC
121122123124125126127128129130131132133134135136137138139140141142143144
T T D P K H A T V V R A I L D R V W E K G D I Y
T T D - - - - - - - - - - - - - - - - - - - - -
ACTACAGAC---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K A K Y E G W Y C V G C E A Y K D D S E M E G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H A C P F H K T R C V E R E E E N Y F F A L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y Q Q Q I Q R V I E E D K S F V Q P A A R R N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V L G W V E A G L R D F S I S R A A V S W G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I P R D P A Q T V Y V W F D A L L G Y M S A L L
- - - - - - - - - Y V W F D A L L G Y M - - - -
---------------------------TACGTTTGGTTCGACGCCCTCCTCGGCTACATG------------
265266267268269270271272273274275276277278279280281282283284285286287288
P E G A S P D E A E L A A R G W P A D V H L V G
- - - - - - - - - - - - - - - - - - - V H L V G
---------------------------------------------------------GTGCACCTGGTGGGC
289290291292293294295296297298299300301302303304305306307308309310311312
K D I L R F H A L Y W P G M L L S A G L P L P R
K D I L R F . A L Y W P G M L L S A - - - - P .
AAGGACATTCTGCGCTTC---GCCCTCTACTGGCCCGGCATGCTCCTCTCCGCC------------CCC---
313314315316317318319320321322323324325326327328329330331332333334335336
K I F A H G F L T K D G M K M G K S L G N I L E
K I F A H - - - - - - - - K M . . S . . . . . .
AAGATCTTCGCACAC------------------------AAGATG------TCC------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P R K L L A A Y G S D A V R F Y F L K E V V F G
. . K . . . . . . S - - - - - - - - - - - - - -
------AAG------------------TCC------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q D G D F S E Q R F R D T V N A F L A N S V G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L N R T L G L L R K N C A G S L P L A A A A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P A D N P L R A V A E L E V A A A A L A Y E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R L H D A L E A V V A I A G R G N L Y M E Q M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P W T A F K K G T D E E K R A A E L A L V A V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E A V R I V A V L L S P V T P R L S S E I Y G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L G Y G P E A Y E G L S W G D A S W G G L P K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Q A T P P P K P V F A R L E G D F V T E V A A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559
K S A A V A A
- - - - - - -
---------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_met_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K F F T E K A N H Q A L K A V L C A M F V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K P L E V T L G S T Y S T P Y L Q L P K S R A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L Y S C N E A A R L L W N T H A A P S P A D N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L E G E A E W L E W E S T V L T P A L T P L Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q R R I T G E A E V A L K K L D S T I E E H Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T V A V K G A P S S T S F L V D S V L F A S L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P A L C E G G L L P A A Q A A R V P H L V K W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q V F Q A E H A E L I A S A F D V L S V Q E C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D F L R V P Q T Y E V S P K K Q K V F F A T T P
- - - - - - - - - - - - - - - - - - - F A T T .
---------------------------------------------------------TTCGCCACGACG---
217218219220221222223224225226227228229230231232233234235236237238239240
I Y Y V N A S P H I G H V Y S T L I V D V L G R
I Y Y V N A S P H I G H V Y S T L I V D V L G R
ATCTACTACGTGAACGCGTCGCCACACATCGGCCACGTCTACAGCACGCTCATCGTCGACGTTCTCGGCCGC
241242243244245246247248249250251252253254255256257258259260261262263264
Y H R V K G E E V F V M T G T D E H G Q K V A E
Y - - - - - - - - F V M T G T D E H G - - - - -
TAT------------------------TTTGTGATGACGGGCACGGACGAGCACGGC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
A A A K Q G V S P M D F T T S V S S E F K Q C F
- - - - - - - - - - - - - T S V S S E F K Q C F
---------------------------------------ACGAGCGTGTCGAGCGAGTTTAAGCAGTGTTTC
289290291292293294295296297298299300301302303304305306307308309310311312
K E M N Y D M N Y F I R T T N P T H E K L V Q D
K E M N - - - - Y F I R T T N - - - - - - - - -
AAGGAGATGAAT------------TACTTCATCCGCACGACGAAC---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I W K K L E A K G D I Y L G K Y E G W Y S V S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E S F L T A Q N V A D G V D K D G K P C K V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E S G H V V T W V E E E N Y M F R L S A F R E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L K Y F H D H P N C I V P E F R R R E V I K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V E K G L F D L S I S R K R E S V M N W S I P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P G D E R H C I Y V W L D A L F N Y Y T G A L T
- - - - - - - - Y V W L D A L F N Y Y - - - - -
------------------------TACGTGTGGCTGGATGCCCTCTTCAACTACTAC---------------
457458459460461462463464465466467468469470471472473474475476477478479480
R V A A D G T E T L D E D H H T L N R W P A D V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTG
481482483484485486487488489490491492493494495496497498499500501502503504
H V V G K D I L K F H A I Y W P A F L M S A E L
H V V G K D I L K F . A I Y W P A F L M S A - -
CACGTGGTCGGCAAGGACATCCTCAAGTTT---GCCATTTACTGGCCAGCCTTCCTGATGTCCGCG------
505506507508509510511512513514515516517518519520521522523524525526527528
P L P E R L V S H G W W T K D R R K I S K S L G
- - P . R L V S H - - - - - - - - K I S K S - -
------CCG---CGGCTGGTGTCGCAT------------------------AAGATCAGCAAGTCG------
529530531532533534535536537538539540541542543544545546547548549550551552
N A F D P V E K A K E F G I D A L K Y F L M R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S N F Q D D G D Y S D K N M V A R L N G E L A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T L G N L V S R C V A P K I N V N G M W P E P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E Y S E S D K T L I A S L N N L A G T V D H Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
C L P D I Q H A L I A I F D V L R S L N A Y V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E N A P W K L V K T D T A R L G T V L Y V T M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G L R I C T M F L Q P V M P Q K A K E I M D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G V P E A A R V D M E N Y L F G I V K P R T K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A G L A E G Q V I F Q K V T L P T E E G E R I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747
E G Q
- - -
---------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_met_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T Y T V T T P L Y Y V N D R P H L G S A Y T T
- - - - V T T P L Y Y V N D R P H L G S A Y T T
------------GTCACCACACCACTCTATTACGTTAATGATCGTCCTCATTTAGGAAGTGCTTATACAACT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A C D A L A R Y Q R L I G K S V V F I T G C D
L A C D A L A R Y Q R L I G . . . . . . . . C D
TTAGCTTGTGATGCATTAGCACGCTATCAACGGCTAATAGGA------------------------TGTGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E H G Q K I Q R T A E A A S L K P Q E S C N Q V
E H G - - - - - - - - - - - - - - Q . . . . Q V
GAACATGGT------------------------------------------CAG------------CAAGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S E E Y H H L W S R W Q I S N D R F I R T T D L
S E E Y H H L W S R W . . . . D R F I R T T D -
AGTGAAGAATATCATCATCTTTGGAGCCGTTGG------------GATCGTTTTATTCGTACTACCGAT---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R H Q A I V K E F F L R V E K A G D I L E G Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q G W Y C V A C E E F K D E P V D A E G D N Q C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A I H Q R R L E W R D E P N L F F N L S R Y Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q I E E L I Q K P G F I L P V S R R R E I E N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V A Q G L H N F S I S R I N L P W G I P V P G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T D H T F Y V W F D A L I G Y L T A L L E P S D
- - - - - Y V W F D A L I G Y L - - - - - - - -
---------------TATGTTTGGTTTGATGCGCTTATTGGGTATTTA------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P P E L D I I L R R G W P A N V H V I G K D I L
- - - - - - - - - - - - - - - V H V I G K D I L
---------------------------------------------GTACACGTTATAGGTAAAGACATTCTT
265266267268269270271272273274275276277278279280281282283284285286287288
R F H A V Y W P A M L M S A G L E V P D M V F G
R F . A V Y W P A M L M S A - - - - P . M V F G
AGATTT---GCTGTATATTGGCCAGCAATGCTAATGTCAGCT------------CCA---ATGGTTTTTGGC
289290291292293294295296297298299300301302303304305306307308309310311312
H G F L T R E G K K M G K S L G N I L D P E L L
H - - - - - - - - K M G K S - - - - - - - - - -
CAT------------------------AAAATGGGAAAATCA------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L E E Y G R D S V R W Y L L R D I P F G E D G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F Q K K R F I D L I N N D L S N T I G N L L N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L S M A R R W F A N A V P D C R E A V T D Q H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S L A K A S Q S A I L I N I T A L D K L E F R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A A E A T L D L A A Q A N T F L S E Q A P W S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I K Q E G G R E Q V G A D L Y A V L E T T R I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S L L L I P L I P E L S I R L Q K Q L G L K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L D G A K V S P K G I T W E S S L S W G Q L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524
G S H L P E P I P V M A R L E N N T N D
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_met_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_met_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K K V P S K K I I T S A L P Y V N N Q P H L
- - - - - - - - - I I T S . L P Y V N N Q P H L
---------------------------ATAATTACAAGT---CTGCCATACGTTAACAACCAGCCACATTTA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G N I I G C V L S A D M Y A R F C R K N N E D V
G N I I . C V L S A D M Y A R F - - - - - - - -
GGTAATATCATA---TGCGTGTTAAGTGCCGATATGTATGCAAGATTT------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F L S G T D E Y G T A I E M A A F A Q N K T P
V F L S G T D E Y G - - - - - - - - - - - - - -
GTTTTTTTGTCTGGTACTGACGAATATGGA------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L Q I C E E N R I I H K K I Y D W F N I D F D F
- - - - E E N R I I H K K I Y D W F . . D - - F
------------GAAGAAAACAGAATTATACATAAAAAAATTTATGACTGGTTT------GAT------TTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F G H T T S T A H T K N V Q D F F N K I H N N G
F G H T T S - - - - - - - - - - - - - - - - - -
TTTGGACATACAACAAGC------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F F T E Q E I E Q F F C D K C Q I F L A D R Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V G T C K F C K Y T D A K G D Q C D G C G H T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K S L D L I D A K C T L C H S F P N I K S T R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L F F D F N N F K D K L Q K L F N T N S Q Y W S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E N G K Q I T K S W L D Q E L L P R C M T R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K N R W G V P V P L K D F E E K V F Y V W F D A
- - - - - - - - - - - - - - - - - - Y V W F D A
------------------------------------------------------TATGTTTGGTTCGATGCA
265266267268269270271272273274275276277278279280281282283284285286287288
V I G Y F T F Y K E Y V A A R S E S K E L D K N
V I G Y F - - - - - - - - - - - - - - - - - - -
GTTATAGGATATTTT---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N V F A T D N I L Q D C E L V Q F M G K D N V F
- - - - - - - - - - - - - - V Q F M G K D N V F
------------------------------------------GTTCAGTTTATGGGTAAAGATAATGTATTT
313314315316317318319320321322323324325326327328329330331332333334335336
F H T I V F P S L I F A T N D S Y P L I K K L S
F . T I V F P S L I F A T - - - - - - I K . L S
TTT---ACAATTGTATTTCCATCTTTAATATTTGCTACT------------------ATAAAA---CTGTCA
337338339340341342343344345346347348349350351352353354355356357358359360
V T E F L L F E N E K F S K S R G H G I F G L D
V T - - - - - - - - K F S K S - - - - - - - - -
GTTACT------------------------AAGTTTTCAAAAAGC---------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L V D N T M G Q S C L W R Y Y L A K I R P E K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D S N F S F T H F T N V I D A D L N N N I G N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C N R V L K Y I K N K N D K L I S I D K L E H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D D L M V Q T I D K I Y K E Y L T S F S A I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R E A L E K I L E I S K V G N E Y V Q Q V V S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K I E V P K G F Q V A F S I V V L I G Q L L E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F I P V S S E K L L K M C N R K K E N F C E S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y I I K S A E I G D D I K P L F N K L D D S L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560
E R I K N F K K
- - - - - - - -
------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_trp_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E G E K S Y K L D P W A S A V K L E Y D K L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R Y F G I K P F Q E L L P R V S Q V F G E P L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L M K R G V I F G H R D Y E T I L D A Y K S G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R I A L V T G F M P S G K F H F G H K M V A D Q
- - A L V T G F M P S G K F H F G H K M V A D Q
------GATTCCTCCCAGCCTACGCTGCTCCTCGACAGTAGCTCTTCCGCCAGTTAATGCACGCTTAAGCTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I I Y Y Q K L G F E V F I V I A D A E A Y A V R
I I Y Y Q K . . . E V F I V I A D A E . . . V -
GCGAACAGCAACATCTAC---------TAGGAATATCGTATAGTCTGGCCTAGAGCT---------GTT---
121122123124125126127128129130131132133134135136137138139140141142143144
K L D R K K V I E I G L Y E Y V A N L I A L G L
- - - - - - - I E I G L Y . Y V A N L I A L . .
---------------------GTGATAGGTGGACGCTGG---CCTTAGCCCTAGCTCGTTCTCAAA------
145146147148149150151152153154155156157158159160161162163164165166167168
E K N K H T H I Y F Q T N Y E K P Y Y R L I Q M
. . . . . T H I Y F Q T N - - - - - - - - - - -
---------------GAACCTAATATGAGGGTCTTGGTC---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F S R K I T M A E M E A I Y G D L E P G K V V A
- - - - - - - - - - - - - - - - - - - - - - V A
------------------------------------------------------------------TGGCTC
193194195196197198199200201202203204205206207208209210211212213214215216
A L T Q A A D I L H P Q L E Y F G G F K Y V L V
A L T Q A A D I L - - - - - - - - - - - - - L V
TAGATCACCATAGATAGCTTCCATTTC---------------------------------------GTAGTA
217218219220221222223224225226227228229230231232233234235236237238239240
P V G A D Q D P H I R F T R D I A D R F E N E L
P V G A D Q D P H I R F T R D I A D R F - - - -
TGGCTTCTCATAGTTAGTCTGGAAGTATATATGGGTATGTTTGTTCTTCTCAAGTCCTAG------------
241242243244245246247248249250251252253254255256257258259260261262263264
G L R R P A S T Y H R F Q T G L D G N K M S S S
- - - R P A S T Y - - - - - - - - - - K M S S S
---------CTCGTACAGTCCTATTTC------------------------------AGCATATGCTTCCGC
265266267268269270271272273274275276277278279280281282283284285286287288
R P D Y T I F L T D P V D V A V R K L K R A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G G R A T V E E Q R R L G G I P E K C T I Y E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y V Y H L L R D D R E L V R I Y N E C K Q G S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L C G P D K Q Y A A E L L A K F L E E H Q K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376
E K A R D R V L E Y V E P P E F
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_trp_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A Q D F T V T P W E V K G K V D Y D K L I V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F G T Q K M T S E L K E R A K R A I N D E L H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M L R R D V F F S H R D F D L I L N D Y E K G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G F F L Y T G R A P S L G M H I G H L I P F I F
- - F L Y T G R A P S L G M H I G H L I P F I F
------GAGCCACTGAAAAGCAACGTCTATATCTGGATTTCCGCCGTATTTCCTGTGAAGTTCCACTGTAGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T K W L Q E K F K V N V Y I E I T D D E K F L R
T K W L Q E . . . . N V Y I E I T D D E . . . .
TTGCCCACCAGAAAATGC------------TTTTCTCTCAACAGTTTTAGGATCATCTGT------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V D Y T L D Q T K E W S Y E N I L D I I A V G
. . . . T - - - - K E W S Y E N I L D I I A V .
------------TGA------------TCCTTCTGGTCCTGTAAGAGGAGGGAGGAACTTACTATGTAT---
145146147148149150151152153154155156157158159160161162163164165166167168
F D P N K T F I F Q D T E Y I K N M Y P L S V K
. . . . . T F I F Q D T E - - - - - - - - - - -
---------------CCCTAAGCTTTCAGCTATATCTCT---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V A K K L T F N E V R A T F G L D T S S N I G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I F Y P A L Q I V P T M F E K R R C L I P A G I
- F Y P A L Q I V P T M - - - - - - L I P A G I
---ATTGGAGGAAGTATCAAGTCCAAATGTAGCTCT------------------TTTTTTAGCAACTTTTAC
217218219220221222223224225226227228229230231232233234235236237238239240
D Q D P Y W R L Q R D I A E S L G Y F K A A Q I
D Q D P Y W R L Q R D I A E S L - - - K A A Q I
GGACAGTGGGTACATATTTTTAATGTACTCAGTGTCCTGGAATATGAA---------GGGATCGAACCCAAC
241242243244245246247248249250251252253254255256257258259260261262263264
H S K F L P P L T G P E G K M S S S Q P E T A I
H - - - - - - - - - - - - K M S S S - - - - - -
AGC------------------------------------TGTCTGATCCAATGT------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y L T D D P K T V E R K I M K Y A F S G G Q A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V E L H R K Y G G N P D I D V A F Q W L Y M F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E P D D Q R I R K I E E D Y R S G A M L T G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K Q I L V D K L D A F L E E H R E K R E K A K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381
L V N V F K F D G D L A R D M W K R I H V
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_trp_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D P W D V E E V D Y E R L T E E F G I R P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D E K V R E L L P R R F P L L D R G I V F G H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D Y D S F L K D Y N D G K L V S V L S G M M P S
- - - - - - - - - - - - - - - S V L S G M M P S
---------------------------------------------AGCGTCCTCAGCGGAATGATGCCCAGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R M H L G H K T V V D Q L V F Y Q Q E M D V K
G R M H L G H K T V V D Q L V F Y Q Q . . . . K
GGCCGAATGCACCTCGGCCACAAGACGGTCGTCGATCAACTAGTGTTTTACCAGCAG------------AAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Y V P I A D L E A H H A R N M D L D R A H R I
V Y V P I A D L E A - - - - - - - - - - - H R I
GTGTACGTTCCCATCGCCGACCTGGAGGCA---------------------------------CACAGGATC
121122123124125126127128129130131132133134135136137138139140141142143144
A V E E Y V L N Y A A L G L D L D P D R C E I Y
A V E . Y V L N Y A A L . . . . . . . . C E I Y
GCCGTCGAA---TACGTCCTCAACTACGCCGCGTTG------------------------TGTGAGATCTAC
145146147148149150151152153154155156157158159160161162163164165166167168
L Q S E R K T V Q R M A L L L A G R L T W N T V
L Q S E - - - - - - - - - - - - - - - - - - - -
CTCCAATCCGAG------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K N T Y G F T G E T N M G H A F A P I V Q A A D
- - - - - - - - - - - - - - - F A P I V Q A A D
---------------------------------------------TTCGCGCCGATCGTCCAAGCCGCCGAT
193194195196197198199200201202203204205206207208209210211212213214215216
I L H P Q E I E G P H R V L V P V G V D Q D P H
I L - - - - - - - - - - - L V P V G V D Q D P H
ATACTA---------------------------------CTCGTACCCGTAGGCGTCGATCAGGACCCTCAC
217218219220221222223224225226227228229230231232233234235236237238239240
L R L T R D I A E K E D L I K P A S T Y H R F M
L R L T R D I A E K E - - - K P A S T Y - - - -
CTCCGGTTGACTCGGGATATAGCGGAAAAGGAG---------AAGCCGGCCAGCACGTAC------------
241242243244245246247248249250251252253254255256257258259260261262263264
T G L T G G K M S S S K P N T A I F L T D D P E
- - - - - - K M S . . . . . . . . . . . . . . .
------------------AAAATGTCC---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T A K E K V W N A K T G G G A T L E E H R E H G
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G N P D E C V V Y E L M V Y H L A D R I G G D E
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K L R E I R K K C R E G D I I C G E C K R M V G
. . . . . . . . . . . . . . . . . . . K . . . .
---------------------------------------------------------AAA------------
337338339340341342343344345346347348349350351352353354355356357358359360
E A L A E I L E E L E R R R E D V R D E L P D L
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
361362363364365366367368369370371372373374
L S Q H P D A P E V P E D W
. S - - - - - - - - - - - -
---TCA------------------------------------
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_trp_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D P W G S A K L E Y Q D L I E N F G V R P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S E V L D E V P E P S W L M R R G I I F G H R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y E R I I S A M K K G E D F A V V T G M M P S G
- - - - - - - - - - - - - - A V V T G M M P S G
------------------------------------------GCGGTTGTAACAGGGATGATGCCAAGCGGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R M H I G H K M I V D Q L R W Y D R M G A E I F
R M H I G H K M I V D Q L R W Y D R . . . E I F
AGGATGCATATAGGCCACAAGATGATCGTGGACCAGCTCAGATGGTACGACAGG---------GAGATATTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I P I A D M E A Y S A R G V D F E D S R R I A I
I P I A D M E . . S - - - - - - - - - R R I A I
ATACCCATAGCAGACATGGAG------TCA---------------------------AGGAGGATAGCCATT
121122123124125126127128129130131132133134135136137138139140141142143144
E E Y I A G Y I A L G L D L E K D N I H V Y L Q
E . Y I A G Y I A L . . . . . . . . I H V Y L Q
GAG---TACATCGCAGGGTACATTGCCCTC------------------------ATACACGTCTACCTCCAG
145146147148149150151152153154155156157158159160161162163164165166167168
S E N L M V E D L A Y V L A G K V N F N E L R A
S E - - - - - - - - - - - - - - - - - - - - - -
TCAGAG------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I Y G F T G S T S M A H M Y A P I I Q V S D I L
- - - - - - - - - - - - - Y A P I I Q V S D I L
---------------------------------------TACGCCCCCATAATACAGGTCTCAGACATCCTG
193194195196197198199200201202203204205206207208209210211212213214215216
H P Q L D E L G G P R P V I V P V G P D Q D P H
- - - - - - - - - - - - - I V P V G P D Q D P H
---------------------------------------ATTGTCCCTGTGGGCCCGGACCAGGACCCCCAT
217218219220221222223224225226227228229230231232233234235236237238239240
I R L T R D I A A R F R D R Y G F I L P S S T Y
I R L T R D I A A R F - - - - - - - L P S S T Y
ATAAGGCTGACACGGGATATAGCAGCCAGGTTC---------------------CTCCCCTCATCAACATAC
241242243244245246247248249250251252253254255256257258259260261262263264
H R F M G G L T G G K M S S N R P K S A I F L S
- - - - - - - - - - K M S S N - - - - - - - - -
------------------------------AAGATGTCAAGCAAC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D T P E E A E A K I R N A K T G G R E T L K E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R E L G G V P E E C I I Y E T L L Y H M S G S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S R L E E I Y E S C R N G T L M C G E C K N N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A E F I R K F F E E L S V K R E K A L P A A R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364
I L E G
- - - -
------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_trp_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E E E F V V T P W E V R G R V D Y E K L L K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F G A K P L T K D E V A L L E K Y A G E V H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I R R G F F Y A H R D F D F I M K W H G E G R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W A L Y T G R G P S G P V H I G H M V P W I L L
- A L Y T G R G P S - P V H I G H M V P W I L L
---CTCCGGGTTCCCCCCGTATTTCCTCTG---CTCTGCTGTTGGCCTGCCCCCGGTGAAGGCGTTCATTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K W F S D K F G L E V Y F Q I T D D E K F Y D D
K W F S D . . . . E V Y F Q I T D D E . . . . .
CTTGCGCCTCACGGT------------TAGGGTGTATATGGCGGAGTCTGGGTTTGA---------------
121122123124125126127128129130131132133134135136137138139140141142143144
P E M K L E E A T N W A Y E N A L D V I A L G F
. . . . . . . A T N W A Y E N A L D V I A L . .
---------------------GAATTTTGAGTATAGAGTTGAGGGCTTGGGGTAGCCCAGGGCATC------
145146147148149150151152153154155156157158159160161162163164165166167168
S P E R L H L I I D T K D I K P L Y P I A V R V
. . . . L H L I I D T K - - - - - - - - - - - -
------------GCGGAAGTAGGGGTCTTGATCTAT------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K K L T W N T V K A T F G F T D S T N I G L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F Y P S L Q I A V A F L P T E L R R E A T P V L
F Y P S L Q I A V A F - - - - - - - - - - - - L
TGTAAAGCCGAAAGTCGCCTTTACTGTATTCCA------------------------------------CAG
217218219220221222223224225226227228229230231232233234235236237238239240
I P C A I D Q D P Y F R L A R D I A D A L G Y P
I P C A I D Q D P Y F R L A R D I A D A L - - -
CGGCTTTATGTCCTTCGTGTCTATTATTAAATGCAGCCTCTCTGGGGAGAAACCTAGGGCAAT---------
241242243244245246247248249250251252253254255256257258259260261262263264
K P S T L Y S K F I M A L T G E S K M S A S N P
K P S T L Y - - - - - - - - - - - K M S A S - -
GGCGTTTTCATACGCCCA---------------------------------GTCGTAGAACTTCTC------
265266267268269270271272273274275276277278279280281282283284285286287288
D S A I Y T L D D E K T V R R K V M N A F T G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R P T A E E Q R K Y G G N P E V C P V F H Y H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L F D P D D A S V E K I R Q D C K S G A L L C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E C K L K L H E K I T K F L K E H R E R R E K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375
R G K V D E Y R L S V K L S K
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_trp_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D T K L D P W S S S D I T D Y S K L F E E F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I S P F E N V L P E I P S P H M Y M R R K V I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H R D Y E Q I A E A M R T G A P F S V M D G F
- - - - - - - - - - - - - - - - - - S V M D G F
------------------------------------------------------TTCAAAGACCGAACATTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M P S G K V H L G H K M V M D Q I V W H Q E M G
M P S G K V H L G H K M V M D Q I V W H Q E . .
CTCGGGTTTTCCTCCCAGTTTTTTCTGCTCTTCGAGGGTTACGCAGCCCCCGGTTTTTGCCCGCTT------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A S A F V G I A D R E A F S V R G F S W Q K C R
. S A F V G I A D R E . . . . . . . . . . . C R
---TGCCCCTTCCTTCGGGGAGTCCGTAAGGGC---------------------------------CCCACC
121122123124125126127128129130131132133134135136137138139140141142143144
E I G V E E Y I L S L I A L G F K P D G L I Y F
E I G V E . Y I L S L I A L G - - - - - L I Y F
CTGCAGTCCGCTCAT---CCTGTGGTAGGTGGAGGCTGGAGGAAT---------------GAACTCGACTGT
145146147148149150151152153154155156157158159160161162163164165166167168
Q S G C G S V K D L A F E L G A K V N F S E L S
Q S G - - - - - - - - - - - - - - - - - - - - -
GACTTCCCT---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A I Y G F S G E T S L S H M L S V A T Q A A D I
- - - - - - - - - - - - - - L S V A T Q A A D I
------------------------------------------CTCTTTCTGGGCGGTTTTTCCCCTGACGCT
193194195196197198199200201202203204205206207208209210211212213214215216
L Q P Q L E E F G G P K P V V V P V G P D Q D P
L - - - - - - - - - - - - - V V P V G P D Q D P
CAG---------------------------------------CCTGAACATGTTCATCTTGCCTGCAAGCCC
217218219220221222223224225226227228229230231232233234235236237238239240
H L R L T R G L A G K M N M F R V E E R E D V K
H L R L T R G L A G - - - - - - - - - - - - - -
TCTTGTCAGGCGGAGGTGAGGGTCCTGGTC------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T G R K Y L S V R G K T A Q K E A L Q E L K K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I P G K V K L Y E E H I D V L E Y P D L A G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K L V R E V T V E F G G Y A F I P P A S T Y H R
- - - - - - - - - - - - - - - - P P A S T Y - -
------------------------------------------------GAGGGCAATAAGGCTTAA------
313314315316317318319320321322323324325326327328329330331332333334335336
F M S G L Q G G K M S S S I P E S Q I A L T D S
- - - - - - - - K M S S S - - - - - - - - - - -
------------------------CTTCTGCCAGGAAAA---------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P K E G A K K V K R A K T G G C V T L E E Q K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L G G K P E E C S V F E L M L F H L I A S D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L E I K Q E C I S G T R M C G S C K Q L A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K M Q E F L K D H Q E K R E L A R E H L D E Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437
I I Y K D
- - - - -
---------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_trp_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K V T P W E V Q I K D E S D Y Q R L I E I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G V K P I D E K L K E K L K E Y T K E L H P L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E R N I F Y A H R D L D L V L K D Y E E G R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F L Y T G I A P S K G K M H I G H L V P F I L T
F L Y T G I A P S K . K M H I G H L V P F I L T
CCAAAAGAACACAACATCTATATCTGGGTT---TCCATATTTTCTATGTAATTCCAAAGTAGGTTGCCCTCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R W F Q E K F D V N V Y I M F P D E E K Y W A K
R W F Q E . . . . N V Y I M F P D E E . . . . .
AGAAAAGGCTTTCAT------------TACTTCTTCATAGCTATCATCTAAAAATAT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
K V D D Y K E V R R K I K E M H A K Y I A A L G
. V - - - - - - R R K I K E M H A K . I A A L .
---AGA------------------CCCCCTTAATCCCCAAATCATTTTGCTTAA---TTCTGCAGCTTT---
145146147148149150151152153154155156157158159160161162163164165166167168
F D P D K T F M F I N S E Y I K H L Y S A A I P
. . . . . T F M F I N S E - - - - - - - - - - -
---------------AGCTATGTCTCTTTGAAGTCTAAA---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I A R H I N L S Q A R A V F G F N D S T S V G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V F Y T V L Q I V P T F F E N K R P L I P A G I
- F Y T V L Q I V P T F - - - - - - L I P A G I
---ATTAAACCCAAATACTGCTCTCGCTTGTGATAA------------------TGGTATCGCTGCAGAGTA
217218219220221222223224225226227228229230231232233234235236237238239240
D Q D P Y F R L Q R D I A P K L N K Y K A A E I
D Q D P Y F R L Q R D I A P K L - - - K A A E I
TAAATGTTTTATATATTCAGAATTAATGAACATAAAAGTTTTGTCTGG---------CAATGCCGCAATATA
241242243244245246247248249250251252253254255256257258259260261262263264
L S K M I W G L R G P Y T K M S S S D P D S A I
L - - - - - - - - - - - - K M S S S - - - - - -
TTT------------------------------------ATAATCATCAACTTT------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F L D D S Y E E V K R K I M K A F S G G Q P T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E L H R K Y G G N P D I D V V F F W L K A L F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E D T K K L K E L E Q S Y R E G T L T T G E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q Y A I E K I W R F L K D L Q E K A K K V D I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377
K Y F Y D G K L A K Q M W E W E L
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_trp_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I N P W S S S D F F D Y E R L K R E F G I G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M N V P F D H F L F R R H L I L G Q R S I D Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D Y A L K H H M K F N V M T G L M P S G E M H L
- - - - - - - - - - N V M T G L M P S G E M H L
------------------------------AACGTTATGACTGGCCTCATGCCTTCAGGAGAGATGCATCTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G N K S A I D Q V I F F Q K L G G R V S I A V A
G N K S A I D Q V I F F Q K . . . R V S I A V A
GGCAACAAGAGCGCCATAGACCAGGTCATCTTCTTCCAGAAG---------AGGGTTTCCATAGCGGTGGCT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D L E S Y S T R G I S L E R A R E V A I E K Y I
D L E . . . . . . . . . . . A R E V A I E . Y I
GATCTCGAA---------------------------------GCCAGGGAAGTTGCCATAGAG---TACATA
121122123124125126127128129130131132133134135136137138139140141142143144
L N Y I A M G L E P C E I Y F Q S R N S D V Q F
L N Y I A M . . . . C E I Y F Q S R - - - - - -
TTGAACTACATTGCCATG------------TGCGAGATATATTTTCAGTCCAGA------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L A Y M L G N R T N M S E L R S L Y G F T D T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L L H I N A P L I Q A A D V L H T Q M K K Y G
- - - - - N A P L I Q A A D V L - - - - - - - -
---------------AATGCGCCGCTGATACAGGCCGCAGACGTACTG------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G P A P T V V P V G F D Q D P H L R L M R D L A
- - - - - V V P V G F D Q D P H L R L M R D L A
---------------GTCGTGCCTGTTGGCTTCGATCAGGACCCGCACCTGAGATTGATGAGGGACCTTGCC
217218219220221222223224225226227228229230231232233234235236237238239240
K R M R I F N I Q L E N D L V V S V R G K D D P
K - - - - - - - - - - - - - - - - - - - - - - -
AAG---------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E Y I D M A Y E Y L S S R Y T N V K K D Y E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R V V R A D G V D Q Q D L V G I D L D L A H M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T K Y N D F A F I A P S A T Y Q K L M K G L K G
- - - - - - - - - A P S A T Y - - - - - - - - -
---------------------------GCTCCGTCTGCAACATAC---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G K M S S S V P D S L I S L N D D P K E A R R K
- K M S S S - - - - - - - - - - - - - - - - - -
---AAGATGTCTTCATCC------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I M A G M T G G R D T E E E Q R R L G G E P D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
C P I F D L Y N Y E I D D D K H V K E V Y D D C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R N G K R M C G F C K R E I A D R M A S W L S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426
L S K K R E E A R E K L S L Y I H E
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Archaeoglobus fulgidus/amino acid sequences/trp_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N V T P W E V E G V I D Y S K L I E E F G M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P F S E V L P E I D N P H I L M R R G A I F G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R D Y W R I I E A M R K K E P W A V M S G F M P
- - - - - - - - - - - - - - - - A V M S G F M P
------------------------------------------------GACCACACATCTATCCGGCTCACC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S G L P H F G H K M T M D E I V W H Q S A G G K
S G L P H F G H K M T M D E I V W H Q S . . . K
GCCAAGCCTTCTCTGCTCCTCGGCTGTCGCCCTTCCACCCGTGAAGGCCTTCATGACCTT---------CTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A F V A I A D M E A H S V R G L S W E K T R E L
A F V A I A D M E . . . . . . . . . . . T R E L
TTCAGGAGGGTCGAGGAGGGAGATGTA---------------------------------AGTAAGCCCTGT
121122123124125126127128129130131132133134135136137138139140141142143144
G M L Y I K S I I A L G L R E D A V I Y F Q S K
G M - Y I K S I I A L . . . . . A V I Y F Q S K
CGTAAA---GTGGTAGGTTGAGGATGGGGGAAT---------------AATTTCAACCTCTATCTTTCTCAC
145146147148149150151152153154155156157158159160161162163164165166167168
S S H V K D L A F E L S A E V N F S E L R A I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G F N S D T S L A K M F V T A I Q A A D I L H P
- - - - - - - - - - - F V T A I Q A A D I L - -
---------------------------------CCTGCTCCTAACTCTCACTCCTCCTTCAACTGG------
193194195196197198199200201202203204205206207208209210211212213214215216
Q L E E F G G P K P V V V P V G A D Q D P H M R
- - - - - - - - - - - V V P V G A D Q D P H M R
---------------------------------CGTCAGTCGCATGTGGGGGTCCTGATCAGCCCCAACAGG
217218219220221222223224225226227228229230231232233234235236237238239240
L T R D L A A R I S I F S F E P V E G G V R V R
L T R D L A A R I - - - - - - - - - - - - - - -
CACCACCACTGGCTTTGGCCCTCCAAA---------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S R K G A E Y L S S L R D L E F D K K I Y E E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
M D I F G E A E E I E R A V R K I E V E I G G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A F I P P S S T Y H R F T T G L T G G K M S S S
- - - P P S S T Y - - - - - - - - - - K M S S S
---------GGCGATGATGGATTTGAT------------------------------CCAGCTCAAACCCCT
313314315316317318319320321322323324325326327328329330331332333334335336
K P E S Y I S L L D P P E E G A K K V M K A F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G G R A T A E E Q R R L G G E P D R C V V F E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y S F H L I D S D E E L N Q I E A E C R E G R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L C G K C K K M A A E L V K S F L K E H Q E K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420
E A V D L S N Y T I I G
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_trp_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K T E V V N P W A S D Q S V D I E R L H A E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G I E R I E T V I D L L P E T P D F I R R G I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F G H R D Y H Q I A N A I R T N E P F N V M T G
- - - - - - - - - - - - - - - - - - - N V M T G
---------------------------------------------------------ACACTTGTCTGCCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F M P S G H P H L G H L M V M K E V V W H V Q Q
F M P S G H P H L G H L M V M K E V V W H V Q .
CCCTCCCAGCTCTTTCTGTTCCTGGAGTGTCATCCGGCCACCGGTCAGGGCTGCCATGATCTTTCTGGT---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G G R G Y I C I A D R E A H A V R N L T W E Q C
. . R G Y I C I A D R E . . . . . . . . . . . C
------GTCATCCTCATAAAACCCGATGATACTCTC---------------------------------ACC
121122123124125126127128129130131132133134135136137138139140141142143144
R K Y G D E Y L S C L Y A L G Y H G E T Y E Q S
R K Y G D - Y L S C L Y A L G - - - E T Y E Q S
GGGCATGAACCGGTG---GGTTGCGGACGGAGTGACAAACCCATA---------GGTTCGCTCTATTGCCCT
145146147148149150151152153154155156157158159160161162163164165166167168
S N R V V Q D L A F E A S A K V N F S E L S A I
S - - - - - - - - - - - - - - - - - - - - - - -
GAC---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y G F T P D T D I G H A M S V L T Q V A D I L H
- - - - - - - - - - - - M S V L T Q V A D I L -
------------------------------------GGCTTCTTTTGACCGGACACTGACATGGGTGTC---
193194195196197198199200201202203204205206207208209210211212213214215216
P Q V N E E P A P T I V P V G L D Q D P H I R L
- - - - - - - - - - I V P V G L D Q D P H I R L
------------------------------AGCTACTCCTCTTGTCAGACGGATATGCGGATCCTGGTCAAG
217218219220221222223224225226227228229230231232233234235236237238239240
T R G V A H K L R M F T V E D R D T H V S V R S
T R G V A H K L - - - - - - - - - - - - - - - -
CCCCACCGGCACGATGGTCGGGGC------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E A P E E A M E A I H K A F R G S K R Y E G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I D I F N V P L D V V K K T V R A I E R T H G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y G F V T P S A T F H R F M P G L T G G K M S S
- - - - T P S A T F - - - - - - - - - - K M S S
------------GAGGCAGGAGAGGTATTC------------------------------GAGGTTTCGTAC
313314315316317318319320321322323324325326327328329330331332333334335336
S I P E S I I G F Y E D D K T V T R K I M A A L
S - - - - - - - - - - - - - - - - - - - - - - -
TGC---------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T G G R M T L Q E Q K E L G G E A D K C P V F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N L F H M V S D D A E L A E I R R K C M A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L M C G Q C K K D S A A R V L A F L D E F R E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422
M A V A A D Q I R S E K S C
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_trp_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E E F K V T P W E V E G V V D Y D K L I K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F G T S P L T E D L L E K T A E L T K S E L P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F F R R K F F F S H R D Y D L I L K D Y E E G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G F F L Y T G R G P S G P M H I G H I I P F F A
- - F L Y T G R G P S G P M H I G H I I P F F A
------TTCCTTTATACTGGAAGAGGACCAAGTGGGCCAATGCACATAGGGCATATAATTCCATTTTTTGCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T K W L Q E K F G V N L Y I Q I T D D E K F L F
T K W L Q E . . . . N L Y I Q I T D D E . . . .
ACAAAATGGCTACAGGAG------------AACTTATACATCCAGATAACCGACGATGAA------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E N L T F D D T K R W A Y D N I L D I I A V G
. . . . T - - - - K R W A Y D N I L D I I A V .
------------ACC------------AAACGATGGGCTTACGACAATATATTAGACATAATCGCAGTG---
145146147148149150151152153154155156157158159160161162163164165166167168
F D P D K T F I F Q N S E F T K I Y E M A I P I
. . . . . T F I F Q N S E - - - - - - - - - - -
---------------ACATTCATATTCCAAAATAGCGAA---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K K I N F S M A K A V F G F T E Q S K I G M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F F P A I Q I A P T F F E R K R C L I P A A I D
F F P A I Q I A P T F - - - - - - L I P A A I D
TTCTTCCCAGCGATCCAAATAGCCCCCACATTC------------------CTAATCCCAGCAGCAATAGAT
217218219220221222223224225226227228229230231232233234235236237238239240
Q D P Y W R L Q R D F A E S L G Y Y K T A A L H
Q D P Y W R L Q R D F A E S L - - - K T A A L H
CAGGATCCTTATTGGAGACTACAGAGAGATTTCGCTGAAAGCCTA---------AAGACCGCAGCACTTCAC
241242243244245246247248249250251252253254255256257258259260261262263264
S K F V P S L T S L S G K M S A S K P E T A I Y
- - - - - - - - - - - - K M S A S - - - - - - -
------------------------------------AAAATGAGCGCCTCA---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L T D S P E D V E K K V W K F T L T G G R P T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E Q R E K G G E P E K C V V F K W L E I F F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E D D K K L K E R Y Y A C K N G E L T C G E C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R Y L I S K I Q E F L K E H Q R R R K K A E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V E K F K Y T G K L A Q E M W N E A I P E P L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386
R S
- -
------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_trp_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E E F R L D P W A S A V R L E Y E K L F R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F G I K P F R E L L P R V T E V L G E P L H L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R R G V I F G H R D F D S V L E A Y R S G E R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L V T G F M P S G R F H F G H K M V A D Q I I
A L V T G F M P S G R F H F G H K M V A D Q I I
GCCCTTGTAACCGGCTTCATGCCCAGCGGCCGCTTCCACTTCGGCCACAAGATGGTGGCGGATCAGATAATA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y Y Q K L G F E I F I V I A D A E A Y A V R K L
Y Y Q K . . . E I F I V I A D A E . . . V - - -
TACTACCAGAAG---------GAGATATTCATTGTTATAGCTGACGCGGAG---------GTC---------
121122123124125126127128129130131132133134135136137138139140141142143144
D R R K V I E T G L Y E Y V A N L I A L G L E K
- - - - - I E T G L Y . Y V A N L I A L . . . .
---------------ATAGAGACGGGCCTCTAC---TACGTTGCCAACCTCATAGCCCTG------------
145146147148149150151152153154155156157158159160161162163164165166167168
N R H T H I Y F Q T N Y E T P Y Y R L I Q M F S
. . . T H I Y F Q T N - - - - - - - - - - - - -
---------ACCCACATATACTTCCAGACCAAC---------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R K I T M A E M E A I Y G D L E P G K V M A A L
- - - - - - - - - - - - - - - - - - - - M A A L
------------------------------------------------------------ATGGCCGCGCTC
193194195196197198199200201202203204205206207208209210211212213214215216
T Q A A D I L H P Q L D Y F G G F K H V L V P V
T Q A A D I L - - - - - - - - - - - - - L V P V
ACCCAGGCTGCAGACATACTA---------------------------------------CTCGTACCCGTT
217218219220221222223224225226227228229230231232233234235236237238239240
G A D Q D P H I R L A R D I A D R F E N E L G L
G A D Q D P H I R L A R D I A D R F - - - - - -
GGAGCCGATCAAGACCCACACATAAGGCTTGCAAGAGATATCGCTGACAGGTTT------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R R P A S T Y H R F Q S G L D G N K M S S S R P
- R P A S T Y - - - - - - - - - - K M S S S - -
---AGGCCGGCCTCGACCTAC------------------------------AAGATGAGCAGCTCT------
265266267268269270271272273274275276277278279280281282283284285286287288
D Y T I F L S D P I D V A V R K L K N A L T G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R A T V E E Q R R L G G E P E K C T V Y E F Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y H L V R D D K K L A R I Y Q E C R G G R L L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G P D K Q Y A A E L L A K F L E E H Q R K L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374
A K D R V L E Y V E P P S F
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_trp_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T D D S V T P Y A V E G D V D Y E K L L A R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G A D A L A D D Q R E R F P D H P L V R R G L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y A G R G V D D F L D A E V Q S I V T G I G P S
- - - - - - - - - - - - - - - S I V T G I G P S
---------------------------------------------TCCATCGTCACCGGCATCGGGCCGTCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G P M H L G H A M V F Y F A K R L Q D E L G A R
G P M H L G H A M V F Y F A K R L Q D . . . . R
GGCCCGATGCACCTCGGCCACGCGATGGTGTTCTACTTCGCGAAGCGCCTGCAGGAC------------CGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Y V P L S D D E K Y W F K D Q T P A E T G D Y
V Y V P L S D D E . . . . . . . T - - - - G D Y
GTCTACGTCCCGCTCTCGGACGACGAG---------------------ACG------------GGCGACTAC
121122123124125126127128129130131132133134135136137138139140141142143144
L R E N L R D L L A V G F D P D L T R F V V D T
L R E N L R D L L A V . . . . . . T R F V V D T
CTCCGGGAGAACCTGCGGGACCTGCTCGCCGTC------------------ACGCGCTTCGTCGTGGACACG
145146147148149150151152153154155156157158159160161162163164165166167168
K D A D V V Y P L A T A F G K D I T H S T L E S
K - - - - - - - - - - - - - - - - - - - - - - -
AAA---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V Y G T P E N V G Q G F Y P A V Q T A H L L L P
- - - - - - - - - - - F Y P A V Q T A H L L - -
---------------------------------TTCTACCCCGCGGTCCAGACGGCCCACCTGCTG------
193194195196197198199200201202203204205206207208209210211212213214215216
Q L V H G E H E T L V P I A V D Q D P H V R V S
- - - - - - - - - L V P I A V D Q D P H V R V S
---------------------------CTCGTCCCCATCGCGGTGGACCAGGACCCCCACGTGCGGGTGAGC
217218219220221222223224225226227228229230231232233234235236237238239240
R D V A A K A R Y P V G K P G A L L M Q F L P S
R D V A A K A - - - - - K P G A L L - - - - - -
CGCGACGTCGCCGCGAAAGCC---------------AAGCCCGGCGCGCTGCTG------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L G G P G K M S S S E G V A I R L T D D P D T V
- - - - - K M S S S - - - - - - - - - - - - - -
---------------AAGATGAGCAGTTCC------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R Q K I R K H A Y T G G Q S S V E A H R E Q G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D P E V D V P F Q Y M S A F F E P D D D E L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V E R E Y R A G D L L S G E L K E L A A D R I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E F L E G H Q D R R D E L D D V E A E L P A Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377
L T E N E R G R A R D A V G F G Y
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Escherichia coli/amino acid sequences/Ecoli_trp_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T K P I V F S G A Q P S G E L T I G N Y M G A
- - - - I V F S G A Q P S G E L T I G N Y M . A
------------CACAAAACCAATCGCTTCGTACACCGCTTTTAGCGTACGGGAAGCGTGTGCGCT---TTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L R Q W V N M Q D D Y H C I Y C I V D Q H A I T
L R Q W V N M Q D D - H C I Y C I V D Q H - - -
TTCTGCGCCGTCTTTCATCACCTGTTGCAG---GGCTTCATCGTTGCGGAAACGGTGGTAACG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V R Q D A Q K L R K A T L D T L A L Y L A C G I
- - - - - - - - R K A T L D T L A L Y L A C . .
------------------------ATCAGCCACTTCACCTTTCAGATGACCATACATCTTGCCTTC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D P E K S T I F V Q S H V P E H A Q L G W A L N
. . . . S T I F V Q S H - - - - - - - - - - - -
------------CGGGATGCTCTGGCCCGTTACCGC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C Y T Y F G E L S R M T Q F K D K S A R Y A E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I N A G L F D Y P V L M A A D I L L Y Q T N L V
- - - - - - D Y P V L M A A D I L - - - - - L V
------------------CAGGCCGATAACGTTATTGCGGTTATCGTCAGA---------------GGTCGG
145146147148149150151152153154155156157158159160161162163164165166167168
P V G E D Q K Q H L E L S R D I A Q R F N A L Y
P V G E D Q K Q H L E L S R D I A Q R F - - - -
CTCCAGCAGCGACATTACGCGCGCGCCAGATTTCGGAATAAACGGCTCTGGCACCTTAAA------------
169170171172173174175176177178179180181182183184185186187188189190191192
G D I F K V P E P F I P K S G A R V M S L L E P
- - - - - - P E P F I P - - - - - - - - - - - -
------------------GGCGATATCGCGGCTCAG------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T K K M S K S D D N R N N V I G L L E D P K S V
- - K M S K S - - - - - - - - - - - - - - - - -
------AGTTTGATACAGCAG---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K K I K R A V T D S D E P P V V R Y D V Q N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A G V S N L L D I L S A V T G Q S I P E L E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F E G K M Y G H L K G E V A D A V S G M L T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q E R Y H R F R N D E A F L Q Q V M K D G A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334
A S A H A S R T L K A V Y E A I G F V A K P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_trp_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N R K P R V F S G I Q P S G N L H I G N Y L G
- - - - - R V F S G I Q P S G N L H I G N Y L .
---------------CGGCAACACAAAACCCACCCGTTCAAGGATCAGGGTCATCTTGGGTTCGGCGAC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I Q Q W V A G Q G Q K T N F I C I V D L H A I
A I Q Q W V A G Q G Q - T N F I C I V D L H - -
ACGCGCCTGTTCGGCGCCAATCGCTAAAATGCG---TAGCTCTGCCGGATCGTCCATCAACTGATA------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T V P Q E P A A L H R Q T R E L A A L L L A C G
- - - - - - - - - H R Q T R E L A A L L L A C .
---------------------------CACAACCTCGGCCAATTCACTTTTTAGTGCGCCATACCCTTT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I D P Q Q T T L F V Q S H V R A H A E C A W V F
. . . . . T T L F V Q S H - - - - - - - - - - -
---------------GATCTCAGGCCGACTTTTTCCGGT---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S C L T P L G W L E R M T Q Y K T K A Q K Q E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V M T G L L T Y P V L M A A D I L L Y D A D E V
- - - - - - T Y P V L M A A D I L - - - - - E V
------------------ATCGACGATCCGAATAGCATGACCGCGAGTGGT---------------CTTGGA
145146147148149150151152153154155156157158159160161162163164165166167168
P V G E D Q K Q H I E L T R D L A Q R F N Y L Y
P V G E D Q K Q H I E L T R D L A Q R F - - - -
CGTCGGATCGTTCAAGCCCATAATGCGGGCTCCGCTCTCACGGATGACCGGCTCAGGAAT------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E T F V I P E P V I R E S G A R I M G L N D P
- - - - - - P E P V I R - - - - - - - - - - - -
------------------CCGCTGTGCCAGATCGCG------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T S K M S K S D T T R G H A I R I V D E P D E I
- - K M S K S - - - - - - - - - - - - - - - - -
------CTCATCGGCGTCATA---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R W A I K R A V T D S Y N E I R F S D D P D R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G V N N L L Q I Y E L L T G K S R P E I E A H F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A G K G Y G A L K S E L A E V V I E S L R P I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E R Y Y Q L M D D P A E L D R I L A I G A E Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R A V A E P K M T L I L E R V G F V L P N D R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_trp_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V L T G L Q P S G D L H I G N Y F G A I K Q
- R V L T G L Q P S G D L H I G N Y F . A I K Q
---AGAGTATTAACAGGCCTTCAGCCAAGTGGCGATTTGCATATAGGTAATTATTTT---GCGATTAAGCAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M V D A Q E K S Q M F M F I A N Y H A M T S S Q
M V D A Q E K - Q M F M F I A N Y H - - - - - -
ATGGTAGATGCACAAGAAAAA---CAAATGTTTATGTTTATTGCTAATTATCAT------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D G E K L K Q N S L K A A A A F L S L G I D P Q
- - - - - K Q N S L K A A A A F L S L . . . . .
---------------AAACAAAATTCCTTAAAAGCTGCTGCGGCTTTTTTAAGCCTT---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K S V F W L Q S D V K E V M E L Y W I L S Q F T
. S V F W L Q S D - - - - - - - - - - - - - - -
---AGCGTTTTTTGGTTGCAAAGTGAT---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P M G L L E R A H S Y K D K V A K G L S A S H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L F S Y P V L M A A D I L L F D T R I V P V G K
- - S Y P V L M A A D I L - - - - - I V P V G K
------TCTTATCCTGTTTTAATGGCGGCAGATATTTTA---------------ATTGTCCCTGTAGGAAAA
145146147148149150151152153154155156157158159160161162163164165166167168
D Q I Q H V E I A R D I A L K V N N E W G E I F
D Q I Q H V E I A R D I A L K V - - - - - - - -
GATCAAATCCAGCATGTTGAAATCGCACGCGATATTGCTTTAAAAGTT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T L P E A R V N E E V A V V V G T D G A K M S K
- - P E A R V N - - - - - - - - - - - - K M S K
------CCAGAAGCGAGAGTTAAT------------------------------------AAAATGAGTAAA
193194195196197198199200201202203204205206207208209210211212213214215216
S Y Q N T I D I F S S E K T L K K Q I S S I V T
S - - - - - - - - - - - - - - - - - - - - - - -
TCT---------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D S T A L E D P K D H E N C N I F K I A K L F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E S G Q K E L Q I R Y E K G G E G Y G H F K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y L N E L V N A Y F K E A R E K Y N E L L E K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S H L K E I L D F G A T K A R K I A Q E K M Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319
I Y E K I G L
- - - - - - -
---------------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_trp_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K D A A S V T P G R R R I L T G L Q P S G Q
- - - - - - - - - - - - - R I L T G L Q P S G Q
---------------------------------------GCCGGCGAGGACCGCGTTCGCGGCGGCGGCTCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L H L G N Y C G A I Q P L L G L Q E A A A A G E
L H L G N Y C . A I Q P L L G L Q E A - - - - -
CTCGCGGAGCACGCCGTCGAC---CGCGTCGTCCCGGAGGATCTCCGCCCGCCGGGC---------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R K L F V F V A S Y H A L T S V A D P A V L R A
- K L F V F V A S Y H - - - - - - - - - - - R A
---GTCCATGACCAGTTCGAAGAGAGCCTGCTT---------------------------------CGCCCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N C R R V V I D Y L A F G L D P A K I N L Y L Q
N C R R V V I D Y L A F . . . . . . I N L Y L Q
GTACCGGTCCGCGAGGGCGAGCGTCCGCAGGTCGTC------------------GAAGATCCGGAACACGGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q D V P A V T E L A W L L A C V C P K A A M D R
Q D - - - - - - - - - - - - - - - - - - - - - -
CGAAGC------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A V A Y K E K V D R G A K P S L G L F T Y P V L
- - - - - - - - - - - - - - - - - - - T Y P V L
---------------------------------------------------------CCCGTCGACGCCCGG
145146147148149150151152153154155156157158159160161162163164165166167168
Q A A D I L G V R P D A V P V G A D Q T Q N V E
Q A A D I L - - - - - A V P V G A D Q T Q N V E
CAGCGTCCCGCCGTCGGC---------------GGGCACCTTGAAGACATCGCCGTAGGTCCGGTTGAACCG
169170171172173174175176177178179180181182183184185186187188189190191192
Y A R D L A G R F N R T Y G D V F K V P E L L V
Y A R D L A G R F - - - - - - - - - - P E L L V
CCCCGCCAGGTCGCGGGCGTACTCGAC------------------------------GGCGTCGGGCCGAAC
193194195196197198199200201202203204205206207208209210211212213214215216
R A D G G T L P G V D G E K M S K S Y G N T I D
R - - - - - - - - - - - - K M S K S - - - - - -
GCC------------------------------------CAAGCCCAGCGAAGG------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P F M D E K P L R K R I M K I K T D S A D P A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A K D P E A S A V F R I F S Q I A G A D D L R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L A L A D R Y R A S G E A G M G Y G E A K Q A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F E L V M D H F G P A R A R R A E I L R D D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V D G V L R E G A A A A N A V L A G V M D D A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342
R A C G L R
- - - - - -
------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_trp_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K S S G T I V L C S H L D S A C P M G K P R V
- - - - - - - - - - - - - - - - - - - - - - R V
------------------------------------------------------------------CGCGTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S G V Q P T G N L H L G N Y L G A I R N W V E
L S G V Q P T G N L H L G N Y L . A I R N W V E
CTTTCCGGCGTTCAACCGACCGGCAACTTGCACCTCGGCAACTATCTC---GCGATTCGCAATTGGGTCGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G Q Q Q Y D N F F C V V D L H A I T V P H E A A
G Q Q Q - D N F F C V V D L H - - - - - - - - -
GGCCAACAGCAG---GACAACTTTTTCTGTGTGGTTGATCTGCAT---------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S L A E N T Y R T A A L Y L A C G I D L S C S T
- - A E N T Y R T A A L Y L A C . . . . S - - T
------GCCGAAAACACCTATCGGACGGCGGCGCTCTATCTCGCCTGC------------AGC------ACC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I F V Q S H V P A H S E L T W L L N C I T P L N
I F V Q S H - - - - - - - - - - - - - - - - - -
ATTTTTGTCCAGTCTCAT------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W L E G M I Q F K E K A L K Q G E N V S T G L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D Y P V L M A A D I L L Y D A D R V P V G E D Q
D Y P V L M A A D I L - - - - - R V P V G E D Q
GATTACCCCGTGCTGATGGCAGCAGATATTCTG---------------CGCGTGCCGGTGGGCGAAGACCAA
169170171172173174175176177178179180181182183184185186187188189190191192
K Q H L E L T R D I A V R I N H L F G R D D T P
K Q H L E L T R D I A V R I - - - - - - - - - -
AAGCAACACTTGGAGTTGACCCGCGACATTGCGGTTCGCATC------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I F K L P E P L I P K A G A R V M S L T D G T K
- - - - P E P L I P - - - - - - - - - - - - - -
------------CCGGAGCCATTGATTCCC------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K M S K S D P T E L S R I N L L D P P E L I E K
K M S K S - - - - - - - - - - - - - - - - - - -
AAAATGTCGAAGTCC---------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K V K R C K T D P Q R G L E F D N P D R P E C N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N L L S L Y A I L S G R S R E T V A A E C A D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G W G Q F K P L L A E A A I E A L R P I Q T K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E E V R S E P G Y L D S V L K Q G R E R A S E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355
A N A T L R R V Q D A L G F S R P V A
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_trp_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G K E K I I L T G D R P T G K L H I G H Y V G
- - - - - I I L T G D R P T G K L H I G H Y V .
---------------ATCATATTAACAGGCGACCGTCCTACCGGAAAGCTCCACATCGGACACTACGTA---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S L K R R V E L Q N S G S F D K T F I F I A D A
S L K R R V E L Q N S - - - D K . F I F I A D A
TCGCTGAAACGGAGAGTCGAACTGCAAAACTCC---------GACAAA---TTCATCTTCATTGCCGATGCA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q A L T D N I D N P E K V R Q N V I E V A L D Y
Q - - - - - - - - - - - - R Q N V I E V A L D Y
CAG------------------------------------CGTCAGAACGTAATTGAAGTAGCTCTCGATTAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L A C G L D P E K S T I F I Q S Q I P E L C E L
L A C . . . . . . S T I F I Q S Q - - - - - - -
CTGGCTTGC------------------TCAACCATCTTCATCCAGTCCCAG---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T F Y Y M D L V T V S R L Q R N P T V K T E I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
M R N F E T S I P V G F F T Y P I S Q A A D I T
- - - - - - - - - - - - - T Y P I S Q A A D I T
---------------------------------------ACTTACCCCATCAGTCAGGCTGCCGACATCACT
145146147148149150151152153154155156157158159160161162163164165166167168
A F R A T T V P V G E D Q E P M I E Q A R E I V
- - - - - T V P V G E D Q E P M I E Q A R E I V
---------------ACCGTACCGGTTGGTGAAGACCAGGAGCCCATGATCGAGCAAGCCAGAGAGATTGTC
169170171172173174175176177178179180181182183184185186187188189190191192
R R F N Y I Y G E T L V E P E I L L P D N A A C
R R F - - - - - - - - - - P E I L L P - - - - -
CGCCGTTTC------------------------------CCGGAGATCCTTTTACCG---------------
193194195196197198199200201202203204205206207208209210211212213214215216
L R L P G T D G K A K M S K S L G N C I Y L A E
- - - - - - - - - - K M S K S - - - - - - - - -
------------------------------AAGATGAGTAAATCG---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E A D E I Q K K V M S M F T D P D H L R V Q D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G K I E G N T V F T Y L D A F C R P E H F E R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L P D Y P N L N E L K A H Y Q R G G L G D V K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K R F L N S I M Q E E L E P I R N R R K E F E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D I P A I Y E M L R K G C E V A R A A A A D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S D V R K A M K I N Y F D D A E L I N E Q V K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363
F N K
- - -
---------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_trp_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G S L P R V F S G I Q P S G N L H L G N Y L G
- - - - - R V F S G I Q P S G N L H L G N Y L .
---------------CGGGTTTTTTCGGGCATTCAACCATCAGGCAATTTGCACCTTGGCAACTATTTG---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I H T W V Q E Q N Q Y D N F F C I V D L H A I
A I H T W V Q E Q N Q - D N F F C I V D L H - -
GCGATTCATACCTGGGTGCAAGAGCAAAATCAA---GATAATTTCTTCTGTATTGTCGATCTGCAT------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T V P Q D P A E L R K N V R D L A A L Y L A A G
- - - - - - - - - R K N V R D L A A L Y L A A .
---------------------------CGCAAAAATGTGCGCGATTTGGCCGCGCTGTATCTGGCCGCA---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I S L E H A T I F V Q S H V P A H V E L G W I L
. . . . . A T I F V Q S H - - - - - - - - - - -
---------------GCCACGATTTTTGTCCAATCGCAT---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N C Q T P L G W L N R M T Q F K D K S Q K Q E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V A A G L M N Y P T L M A A D I L L Y D T Q V V
- - - - - - N Y P T L M A A D I L - - - - - V V
------------------AATTATCCAACGCTGATGGCTGCTGATATTTTG---------------GTTGTG
145146147148149150151152153154155156157158159160161162163164165166167168
P V G D D Q R Q H I E L T R D I A E R F N H L Y
P V G D D Q R Q H I E L T R D I A E R F - - - -
CCAGTGGGCGACGATCAACGTCAGCATATTGAGCTAACTCGCGATATTGCCGAGCGTTTT------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E T F V I P E A L I R P V A A R V M G L D D P
- - - - - - P E A L I R - - - - - - - - - - - -
------------------CCCGAGGCCTTGATTCGG------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T Q K M S K S N K A A N H S I P L L G D L K A T
- - K M S K S - - - - - - - - - - - - - - - - -
------AAGATGAGCAAGAGC---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R K A M M R A V T D S G S E I K F D E T R P G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N N L L G I Y Q A L T G K D K A T I E A E F E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q G Y G K L K G A V A D V V I A T L E P L Q Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y N Q L T A D P A E L D G I L K R G A E R A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328
V A N A T L L R A Y Q Q L G L R
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_trp_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T V S V R P R I L S G V Q P S G K L H L G N Y
- - - - - - - R I L S G V Q P S G K L H L G N Y
---------------------CCCGACGGACTGCCGCACCAGTTGCAACGTGATCTGCGCCGCCGCACGGGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F G A I K Q H I E R Q D T G E C F Y F I A D Y H
F . A I K Q H I E R Q D T - E C F Y F I A D Y H
CTT---GGCGCCGGCGGTGAGCACCTCCTCGACGTACCC---GTCGCGCGCGAGTTGCTTCCGGCGCTCGCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A L T S L K E A E E K E A G T A A K N K S I T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R P A R Q I L A E N V R D V A L D Y L A L G L D
- - - - - - - A E N V R D V A L D Y L A L . . .
---------------------CATCGGGTTCCGGTACAGGTCGGCCATCTCGGCCTGCTCGGC---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P A K A S F F R Q S D V P E V C E L A W F F S S
. A - - S F F R Q S D - - - - - - - - - - - - -
---CAG------CAGCGCAAACGCGTTGCACTT---------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V F G T A H L E R A H S Y K D K V A R G I T P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V G L F T Y P L L M A A D I L I Y R S H L V P V
- - - - T Y P L L M A A D I L - - - - - L V P V
------------GCCGTCGGTACCCGGCACGACCGCGGCTTCGTT---------------GAGCGGGAAAAT
169170171172173174175176177178179180181182183184185186187188189190191192
G K D Q E Q H L E M T R D V A G A F N N A Y G E
G K D Q E Q H L E M T R D V A G A F - - - - - -
CTCTCCGTAGGCGTTGTTGAACGCCCCGGCGACATCGCGGGTCATCTCCAGGTG------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I F P L P D G V Y N E A A V V P G T D G Q K M S
- - - - P D G V Y N - - - - - - - - - - - K M S
------------GTGCGAACGGTAGATGAG---------------------------------CAGCCCGAC
217218219220221222223224225226227228229230231232233234235236237238239240
K S Y G N T I E I F A E G K P L K N A V M G V V
K S - - - - - - - - - - - - - - - - - - - - - -
GCTCGG------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T D S T P V E E P K N P D K C N A F A L Y K L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S T A A E Q A E M A D L Y R N P M K G A E G R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G R P F G Y G D A K T L L L A K I D S Y F A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R E R R K Q L A R D P G Y V E E V L T A G A R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359
A R A A A Q I T L Q L V R Q S V G M G S R P V
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_trp_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A M R V L S G I Q S T G N L H L G N Y L G A I
- - - R V L S G I Q S T G N L H L G N Y L . A I
---------TACGGAGAAGCCCAAAGCTGTTTTAACTTTGCTCAGGGTATCGTTAGCGATCGC---TGCTTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R N W V E G Q S Q Y E N Y L F V A D L H A I T V
R N W V E G Q S Q - E N Y L F V A D L H - - - -
TTGCTTGCCATCGCGCAATACTGACTC---ATATCCCTTATCTGCCATTACCTCGTTGTA------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P H K P E E L A A N T Y T L A A L Y L A C G L D
- - - - - - - A A N T Y T L A A L Y L A C . . .
---------------------TGTTTCGGTTAGCAGTGGTTTAAATTGTCCCCAGCCCATATC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K Y S T I F I Q S H V P A H S E L T W L F N C
. . . S T I F I Q S H - - - - - - - - - - - - -
---------TTCCTGCTTGGTTTTGCCAGATAG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I T P L N W L E D M I Q F K E K A V K Q G E N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S V G L L D Y P V L M A S D I L L Y Q P D K V P
- - - - - D Y P V L M A S D I L - - - - - K V P
---------------ATTAATTCGACTCAACTCTGAGGGGTCTGACTT---------------TCCGTCTGT
145146147148149150151152153154155156157158159160161162163164165166167168
V G E D Q K Q H L E I T R D I A A R F N Y Q F A
V G E D Q K Q H L E I T R D I A A R F - - - - -
CAGACTCATCACCCTTGCGCCTTCTGCCCGAATCAAAGGTTCTGGTAACTTCAACAC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
R E N P V L K L P E P L I R A E G A R V M S L T
- - - - - - - - P E P L I R - - - - - - - - - -
------------------------AATGTCGCGAGTAATTTC------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D G T K K M S K S D P S E L S R I N L L D T P D
- - - - K M S K S - - - - - - - - - - - - - - -
------------TTGATAGAGTAAGAT---------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q I Q Q K I K R C K T D P I R G L V F D D P E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P E C N N L L T L Y M L L S G K T K Q E V A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
C Q D M G W G Q F K P L L T E T A I A A L K P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q D K Y N E V M A D K G Y L E S V L R D G K Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334
A A A I A N D T L S K V K T A L G F S V P L
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_trp_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I V S G M R P T G K L H L G H Y F G V I R N
- R I V S G M R P T G K L H L G H Y F . V I R N
---CGAATAGTTAGCGGAATGAGACCCACCGGGAAGCTCCATCTCGGACACTACTTC---GTTATAAGAAAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V K L Q E E H E C F F F I A D W H A L T T A Y
W V K L Q E E - E C F F F I A D W H - - - - - -
TGGGTGAAACTTCAGGAAGAG---GAGTGTTTTTTCTTCATAGCGGACTGGCAT------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K N T K E L R Q N I R E V M I D W L A L G L D P
- - - - - - R Q N I R E V M I D W L A L . . . .
------------------AGACAAAACATAAGGGAGGTTATGATAGATTGGCTCGCTCTG------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q K S V L F I Q S L V K E H A E L F L L F G M I
. . S V L F I Q S L - - - - - - - - - - - - - -
------AGTGTCCTCTTTATTCAATCTCTC------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T P K S W L E L N P T Y K D L K Y N L L R L T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L E K E F K E K L K E R I S E I V N L I P F N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T K E E K F R E H L L E N L T Q T M I E A L F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E I E P E I L K R L N V S K R D F Y E T D T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G F L G Y P V L Q A A D I L I Y K G E G V P V G
- - - G Y P V L Q A A D I L - - - - - G V P V G
---------GGATATCCAGTTCTACAAGCGGCGGACATACTC---------------GGTGTGCCCGTGGGA
217218219220221222223224225226227228229230231232233234235236237238239240
E D Q L P H I E L S R E I A R R F N R L Y G K I
E D Q L P H I E L S R E I A R R F - - - - - - -
GAGGATCAACTTCCTCACATAGAACTCTCCCGTGAAATAGCAAGAAGGTTT---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F P E P K A L L T E T P K I P G T D G R K M S K
- - - P K A L L T - - - - - - - - - - - K M S K
---------CCAAAAGCCCTCCTGACA---------------------------------AAGATGTCAAAA
265266267268269270271272273274275276277278279280281282283284285286287288
S Y G N A V F F S D E K E E V E K K V M K M F T
S - - - - - - - - - - - - - - - - - - - - - - -
TCT---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D P Q K I R K N D P G R P E I C P V F S W H K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F T K D E E L V K K I E E D C R A G R L G C V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C K R I L L K H L E E F L E P I R E R R R E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K R I N E I E E V F Y E N S R K A R E I A Q K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395
M E E V R K A M N L P
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_trp_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F P D R I F S G M R P T G S L H L G H Y H G V
- - - - R I F S G M R P T G S L H L G H Y H . V
------------CGTATCTTTTCCGGCATGCGACCCACGGGGTCGCTCCATCTCGGCCACTATCAC---GTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K N W V K L Q S E Y P C F F C V V D W H A L T
L K N W V K L Q S E - P C F F C V V D W H - - -
CTGAAGAACTGGGTCAAGCTGCAGTCCGAG---CCGTGCTTCTTCTGCGTCGTCGACTGGCAT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T H Y E T P E V I E K N V W D V L I D W L A S G
- - - - - - - - - E K N V W D V L I D W L A S .
---------------------------GAGAAGAACGTCTGGGACGTGCTGATCGACTGGCTTGCGTCG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I D P A Q A T L F I Q S K V P E H A E L A L L L
. . . A - - T L F I Q S K - - - - - - - - - - -
---------GCG------ACGCTCTTCATCCAGAGCAAG---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G M S T P L G W L E R V P T Y K E Q I E K L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K D L S T Y G F L G Y P V L M A A D I L L Y R G
- - - - - - - - - G Y P V L M A A D I L - - - -
---------------------------GGCTATCCGGTGCTGATGGCGGCCGACATCCTG------------
145146147148149150151152153154155156157158159160161162163164165166167168
S L V P V G E D Q V P H V E M T R E I A R R F N
- L V P V G E D Q V P H V E M T R E I A R R F -
---CTCGTGCCGGTCGGCGAGGATCAGGTGCCGCACGTCGAGATGACGCGCGAGATCGCGCGCCGCTTC---
169170171172173174175176177178179180181182183184185186187188189190191192
Y L Y G R E P G F E E K A L E A A K K L G G K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A K L Y H E L R N A Y Q Q E G D D E A L E Q A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A M L Q E S Q S L S M S D R E R L F G Y L E G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R K I I L V E P Q A L L T E A S R M P G L D G Q
- - - - - - - P Q A L L T - - - - - - - - - - -
---------------------CCGCAGGCGCTTCTGACC---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K M S K S Y G N T I G L R E D A E T I T K K V R
K M S K S - - - - - - - - - - - - - - - - - - -
AAGATGTCGAAGTCG---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T M P T D P A R V R R T D P G D P D K C P V W Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L H Q V Y T D E A T H E W V Q K G C R S A G I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C L D C K Q P V V E G I L R E Q Q P M L E R A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K Y M D D P S L L R A I V A D G C D K A R K Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400
T E T M R D V R E A M G L S Y S
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_trp_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K T I F S G I Q P S G S V T L G N Y I G A M
- - - T I F S G I Q P S G S V T L G N Y I . A M
---------TTTTCGGCCGAGTCCCATCGCGTTTTCCATTTTTTTTAGCATCTTGTTTGCTGT---ATTTGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K Q F V D L Q D D Y N C Y F C I V D Q H A I T V
K Q F V D L Q D D - N C Y F C I V D Q H - - - -
GCGTTCGGCGCCTTCGTCCAAAATCCG---CAGCTCTTCAGATTCGATCAATTCGTGGTA------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Q D R L A L R K N I R N L A A L Y L A I G L D
- - - - - - - R K N I R N L A A L Y L A I . . .
---------------------GACTTCGGCAAGGTCTGATTTAAATTCGCCGTAGCCTTTGCC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P K K A T L F I Q S E V P A H A Q A G W M L Q C
. . . A T L F I Q S E - - - - - - - - - - - - -
---------CTCTTCGATTGAGGCTTGTCCGAG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V A Y I G E L E R M T Q Y K D K S A G K E A V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S G L L T Y P P L M A A D I L L Y G T D V V P V
- - - - T Y P P L M A A D I L - - - - - V V P V
------------CAGGGTGATGAACGCTTTTTGGTTCGGATCTGA---------------GAGCGGGTCGGC
145146147148149150151152153154155156157158159160161162163164165166167168
G E D Q K Q H L E L T R N L A E R F N K K Y N D
G E D Q K Q H L E L T R N L A E R F - - - - - -
AAGTGACATAATGCGGGCGCCGACCTTCGGTATTTTAACCTCCGGAACCGTAAA------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I F T V P E V K I P K V G A R I M S L A D P L K
- - - - P E V K I P - - - - - - - - - - - - - -
------------CGCCAAGTTCCGGGTTAA------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K M S K S D P N Q K A F I T L L D E P K Q L E K
K M S K S - - - - - - - - - - - - - - - - - - -
TGTTCCATAAAGCAG---------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K I K S A V T D S D G I V K Y D K E N K P G V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N L L T I Y S I L G Q A S I E E L E A K Y E G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G Y G E F K S D L A E V V I G A L K P I Q D R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H E L I E S E E L D R I L D E G A E R A N Q T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330
N K M L K K M E N A M G L G R K R R
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_trp_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K R K V M L T G D R P T G A L H L G H Y V G S
- - - - V M L T G D R P T G A L H L G H Y V . S
------------TTTTAATTTTTTCTCAGCGCTATATTTTATTCCATTCCAAGTTTTTGAAAGCCC---TAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V V N R L K F Q E E Y E T Y F I I A D L H T L T
V V N R L K F Q E E - E T Y F I I A D L H - - -
ATCCTTAACATCTTTTACTACTTTATTTGC---AAACCTCGCCTTGCTTGTACCATCAAAAAT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T K P D L K S I N T I P S N V R E M V L D Y L A
- - - - - - - - - - - P S N V R E M V L D Y L A
---------------------------------TCTTTTATCTCTTATTGGCTTTAAAAAACTATTCAAAGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
C G I N P D K V S I Y L Q S A I P E L F E L H L
C . . . . . . V S I Y L Q S A - - - - - - - - -
TAA------------------CTCAACATCACCTACTTTACCCTT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I F S M I V T V A R L Q R I P S I K D M S I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G L K E I P Y G L L G Y P V L M S A D I L M T K
- - - - - - - - - - G Y P V L M S A D I L - - -
------------------------------AGACATAATTTTTTTTTCTAATAAATTTTCATC---------
145146147148149150151152153154155156157158159160161162163164165166167168
A N L V P V G R D N E S H I E F A R E L A R R F
- - L V P V G R D N E S H I E F A R E L A R R F
------TGCATTATCAAGGCTCTTGCTCATTTTATTTTTGCCATAAATACCCACCAAAGGACGAGAATCTGT
169170171172173174175176177178179180181182183184185186187188189190191192
N H L Y K N N F F P I P E S V F T D S R P L V G
- - - - - - - - - - - P E S V F T - - - - - - -
---------------------------------TTTGTACAAATGGTTAAA---------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I Y G K N K M S K S L D N A I F L N D D E N L L
- - - - - K M S K S - - - - - - - - - - - - - -
---------------TTCATTATCACGCCC------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E K K I M S M Y T D P N R I R A D I P G N V E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N P I F I Y H S F F N S N H E E V E D L K S R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K K G K V G D V E V K K K L F L A L N S F L K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R D K R S F Y E A K K K D Y I D E I I F D G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S K A R F I A N K V V K D V K D L I G L S K T W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351
N G I K Y S A E K K L K N E E
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_trp_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P R I L T G I Q C T G R P H L G N V L G A M L
- - R I L T G I Q C T G R P H L G N V L . A M L
------CGTATACTCACAGGCATTCAATGTACAGGAAGGCCCCATTTGGGGAATGTACTG---GCCATGTTA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P T L E L A A K P T Y D T F I F L A D L H T L T
P T L E L A A . . T - D T F I F L A D L H - - -
CCTACTTTAGAATTGGCTGCC------ACC---GACACTTTTATCTTTCTGGCAGATTTACAT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T L K D S Q E R R N Y V Y A A A A A W L A L G L
- - - - - - - - R N Y V Y A A A A A W L A L . .
------------------------AGAAATTATGTATATGCTGCTGCTGCTGCTTGGCTTGCCTTG------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D P A K V T F Y R Q S K V P A V C E L V W Y L S
. . . . V T F Y R Q S K - - - - - - - - - - - -
------------GTCACCTTTTATAGACAATCTAAA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C F T P Y P M L A N A H A F K D K A D R M S M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S A G L F T Y P I L M A A D I L L Y H A D I V P
- - - - - T Y P I L M A A D I L - - - - - I V P
---------------ACCTACCCCATACTGATGGCAGCAGACATCTTA---------------ATAGTACCA
145146147148149150151152153154155156157158159160161162163164165166167168
V G K D Q L Q H L E I T R D I A T S F N Q Q Y G
V G K D Q L Q H L E I T R D I A T S F - - - - -
GTTGGGAAAGATCAGCTACAACATTTAGAGATTACTCGTGATATTGCCACCAGCTTT---------------
169170171172173174175176177178179180181182183184185186187188189190191192
P V F H L P Q A L I D N S I A T V P G I D G Q K
- - - - - P Q A L I D - - - - - - - - - - - - K
---------------CCCCAGGCATTAATAGAT------------------------------------AAA
193194195196197198199200201202203204205206207208209210211212213214215216
M S K S Y H N T I D I F L P E K E L R K L V M R
M S K S - - - - - - - - - - - - - - - - - - - -
ATGAGTAAATCA------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I Q T D S K S V A E S K D P D T C I V F K L Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L V A N T T D I D T M R K N Y T A G G Y G Y G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A K E E L F A T I L E R F A V A R E K F A Q Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T D I S N L E K I L M S G E A K A S V V A T E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322
L S T I R G K L G Y
- - - - - - - - - -
------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_trp_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S R V F S G I Q P T G D P H I G N Y F G A M Q
- - R V F S G I Q P T G D P H I G N Y F . A M Q
------CTTCAGGAAGCCCACCTTCTGCCGCACTTCGTCCATCACTTCGCTGGCGATGGC---GGCTTCCTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N Y V R L G E Q Y G K Q S L Y C V V D L H A I T
N Y V R L G E Q - - - Q S L Y C V V D L H - - -
GTCGCCCTGGCGCAGCGCGTCGCG---------GGGGTCGGCGCGGAGTTGCGCGGCCCGCGT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N P G A F D P Q T L A Q K T F D M A V A N F A I
- - - - - - - - - - A Q K T F D M A V A N F A I
------------------------------CATCTTCTTGCAGTCCACGCAGCCGATGCCCGCCGTGCGGCA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G L D P S K V V F F V Q S H V P E H Q E L S W I
. . . . . . V V F F V Q S H - - - - - - - - - -
------------------GAGCGTCTCAGGCGGCGAAAACAG------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F T C V T P V G E L E R M T Q Y K D K S A Q F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S V P S G L L M Y P A L M A A D I L L Y K A D I
- - - - - - - M Y P A L M A A D I L - - - - - I
---------------------GATGGTGTTGCCCTTGCTCTTGCTCATCTTGCC---------------GGG
145146147148149150151152153154155156157158159160161162163164165166167168
V P V G E D Q T Q H I E L T R E I A R K F N H N
V P V G E D Q T Q H I E L T R E I A R K F - - -
AATCCGCAGGGCCTCTTTGTTGTAGACGGCCTTGGGCTCGGTGAACGTCTCGCCGAAGTTGTG---------
169170171172173174175176177178179180181182183184185186187188189190191192
F G E T F T E P K A V Y N K E A L R I P G V D G
- - - - - - - P K A V Y N - - - - - - - - - - -
---------------------CTCGATGTGCTGGGTCTG---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q G K M S K S K G N T I G I L E P F G D I W Q K
- - K M S K S - - - - - - - - - - - - - - - - -
------GATGTCGGCGGCCAT---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L R V A P T D P A R V R R T D P G D P D K C L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G D Y H K L F S P P E T L E T V Y Q G C R T A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I G C V D C K K M L M T H I T E H L D P I Q T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A A Q L R A D P D Y V R D A L R Q G D Q E A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330
I A S E V M D E V R Q K V G F L K L
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_trp_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E T L F S G I Q P S G I P T I G N Y I G A L K
- - T L F S G I Q P S G I P T I G N Y I . A L K
------CTTACGTCCTAAACCCATCGCTTTTTCCATTTTTTTGACAGTTTTAAATGAAGC---ATGTGCTTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q F V D V Q N D Y D C Y F C I V D Q H A I T M P
Q F V D V Q N D - D C Y F C I V D Q H - - - - -
ATCTCTACCTTGATCTAAAATATC---AAGTTTATCTGAGTTATAGAAACTTTCGTA---------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q D R L K L R K Q T R Q L A A I Y L A S G I D P
- - - - - - R K Q T R Q L A A I Y L A S . . . .
------------------TATTTCAGCAAGGTCGCCTTTGAATTTACCGTAACCTTCGCC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K A T L F I Q S E V P A H V Q A G W M L T T I
. . A T L F I Q S E - - - - - - - - - - - - - -
------ATCTTTAATAGGCATGTCTGTTAA------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A S V G E L E R M T Q Y K D K A Q K A V E G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A G L L T Y P P L M A A D I V L Y N T N I V P V
- - - - T Y P P L M A A D I V - - - - - I V P V
------------TGAAATAAAGTTTTTAGCGTTGTCATCACTTTT---------------TGGATCTTGTAA
145146147148149150151152153154155156157158159160161162163164165166167168
G D D Q K Q H I E L T R N L V D R F N S R Y N D
G D D Q K Q H I E L T R N L V D R F - - - - - -
ACTCATAACACGGCCACCGACTTTAGGCATACGAATTTCAGGTTTCACAAGGAC------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V L V K P E I R M P K V G G R V M S L Q D P T R
- - - - P E I R M P - - - - - - - - - - - - - -
------------AAGATTACGTGTTAATTC------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K M S K S D D N A K N F I S L L D E P N V A A K
K M S K S - - - - - - - - - - - - - - - - - - -
ATTGTAAAGAACAAT---------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K I K S A V T D S D G I I K F D R D N K P G I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N L I S I Y A G L T D M P I K D I E A K Y E G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G Y G K F K G D L A E I V K A F L V E F Q E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E S F Y N S D K L D D I L D Q G R D K A H K A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329
F K T V K K M E K A M G L G R K R
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_trp_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T A T T A T A P Q T T Q P T G A A T R T I V
- - - - - - - - - - - - - - - - - - - - - - I V
------------------------------------------------------------------CTCCTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V S G I Q P S G E L H L G N Y F G A I R Q H L E
V S G I Q P S G E L H L G N Y F . A I R Q H L E
CGCCCGCCGGCGGCCCTTGCGGGCCCCCTCGCGCAGCACGTCTATCAC---GTCCGGATGCTTCAGCAGCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L H E R Y E S Y F F I V N Y H A L T T I H D R E
L H E . . E S Y F F I V N Y H . L - - - - - - -
GCGCCGCCG------CGCCTCGGCAAAGTGCTCGTCGATGAGCCG---CAG---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L R R Y T F E A A V T Y L A L G F N P E K A A
- - R R Y T F E A A V T Y L A L . . . . . . A A
------GCCACCCCGCCGGTAGGCTTCGGCGATCCGGTTGCGCGTTTC------------------GATCAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L F V Q S D V P E V T E L A W I F Y N L V P V S
L F V Q S D - - - - - - - - - - - - - - - - - -
CGCAAACACGTTACAGCG------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T L E K G V A Y K D K V A Q G L P A N A G L F N
- - - - - - - - - - - - - - - - - - - - - - - N
---------------------------------------------------------------------GCC
145146147148149150151152153154155156157158159160161162163164165166167168
Y P V L Q A A D I L I Y G G T L V P V G A D Q K
Y P V L Q A A D I L - - - - - L V P V G A D Q K
ATCAATGCCCGGCACCACGGCCACCTCTTC---------------CGGAATGGGGAACAGCGGCCGATCCGG
169170171172173174175176177178179180181182183184185186187188189190191192
Q N I E I C R D I A Q R F N R T F C P P D R P L
Q N I E I C R D I A Q R F - - - - - - - - - - -
CGGGCAGAACGTCCGGTTGAAGCGCTGCGCGATGTCGCG---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F P I P E P L I R E E V A V V P G I D G R K M S
- - - P E P L I R - - - - - - - - - - - - K M S
---------GAGCGTGCCCCCGTAGAT------------------------------------GAGCCCGGC
217218219220221222223224225226227228229230231232233234235236237238239240
K S Y G N T I G I F D E G K T L R K K V M S I V
K S - - - - - - - - - - - - - - - - - - - - - -
ATTGGC------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T D S T P L E A P K D P D R C N V F A L I K L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A D E E T R N R I A E A Y R R G G Y G Y G D A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E L I R L I D E H F A E A R E R R R E L L K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P D Y V I D V L R E G A R K G R R R A Q E M M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354
Q V R D L V G L N Y A T Y R P E A S
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_trp_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E D P A A Q E V V V T P W T V E G D V N Y D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I K H F G C Q A I D E K L L E R M E R L T R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K P H H F L R R G I F F S H R D L N L I L D A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E K G Q P F Y L Y T G R G P S S E S M H V G H L
- - - - - - Y L Y T G R G P S S E . M H V G H L
------------------CATAGGTACGTCGACGTTGGTGTTACCACCAAG---CAGCTGCTCCTTCTTATC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I P F M F T K W L Q D T F H V P L V I Q L T D D
I P F M F T K W L Q D T - - - P L V I Q L T D D
TGCGCCACCACCGCTGAAGGCGTGTTTGTTGATCTT---------CATCTTGGGGGTGTCTGTCAGAAAGAC
121122123124125126127128129130131132133134135136137138139140141142143144
E K F F F K D L T M D E I D K M T T E N L K D I
E - - - - - - - - - - - - D K M T T E N L K D I
GGC------------------------------------ACTAAGACCGGGGAAGAACTTGGAGTGGATAAC
145146147148149150151152153154155156157158159160161162163164165166167168
I A F G F D P K L T F I F R D F E Y V G R M Y R
I A F . . . . . . T F I F R D F E - - - - - - -
GGCTGGCTT------------------CGCCACGTCGCGCGTAAGACGGAA---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I V A R I E K A Y T A S Q V R G C F G F K M E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N C G R W M F P A I Q A A P S F S A A F P H I F
- - - - - M F P A I Q A A P S F - - - - - - - -
---------------AGGGAACATCCAGCGGCCGCAGTTGTCCTCCAT------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P Q E K G N V F C M I P Q A I D Q D P Y F R L T
- - - - - - - - - M I P Q A I D Q D P Y F R L T
---------------------------GCGTGCGACAATGCGATACATCCGTCCCACGTACTCAAAGTCCCT
241242243244245246247248249250251252253254255256257258259260261262263264
R D V A P R M G Y L K P A V I H S K F F P G L S
R D V A P R M - - - - P A V I H S - - - - - - -
GAAGATGAACGTCAGCTTCGG------------GGCAATGATGTCCTTCAA---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G S K G K M S S S T G A A V F L T D T P K M I K
- - - - K M S S S - - - - - - - - - - - - - - -
------------TGTCAAGTCCTTGAA---------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D K I N K H A F S G G G A D K K E Q L L L G G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T N V D V P M Q W L R F F L E D D E E L T R L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K D Y M L G R I M T G D V K K V L I Q Q I T S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V T A H Q E A R K K V T E A D V E L F T A V R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396
M G P A K E E A E S R K
- - - - - - - - - - - -
------------------------------------
Class I
Eukaryotes/Dictyostelium discoideum/amino acid sequences/Ddiscoideum_trp_aa
Eukaryotes/Dictyostelium discoideum/nucleotide sequences/Ddiscoideum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K I D E V N F K D K T K V T V F S G M Q P T S
- - - - - - - - - - - - - - T V F S G M Q P T S
------------------------------------------TTTATTTGCAATTTTATTTGCTTTTTCAGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S A L H L G N Y L G A M G N W L K I Q D L V T K
S . L H L G N Y L . A M G N W L K I Q D L - - -
TCC---TAATAAAATATCTCTAACTAA---CGGATTTGATTGATAATAATTAATTTTTTCACG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N N K E E E E L L N L S E S S S S S S S S Q S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I N E K H K L I F S I V D L H S L T S T K S L
- - - - - - K L I F S I V D L H - - - - - - - -
------------------ACCAGAGGTTTCAGATGCAATTGATAATAG------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S P K E L Q S N T I S V A I N Y L A C G I D P E
- - - - - Q S N T I S V A I N Y L A C . . . . .
---------------ACCAATGATTGTATCAGTTTTTGATTTTTTAATTTTTAATTT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
K V I L F N Q S M V P A H S E L T W I L N C I T
. V I L F N Q S M - - - - - - - - - - - - - - -
---TGTTAATGAAATTCTTGAAATCTC---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S F S K L S N M I Q F K E K T K S S N E A S V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N G L L S Y P V L M A A D I L L Y K A T H V P V
- - - - S Y P V L M A A D I L - - - - - H V P V
------------GATATCTCTGGTGAATTCTAAATGCTGAGTTTG---------------TACATGTGTGGC
193194195196197198199200201202203204205206207208209210211212213214215216
G E D Q T Q H L E F T R D I A Q A F H S N F K S
G E D Q T Q H L E F T R D I A Q A F - - - - - -
TTTATACAATAAAATATCGGCAGCCATTAAAACTGGATATGATAAAAGTCCATT------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K F F P Y P S I I T S E Q S K R I M S L Q D G R
- - - - - P S I I T S - - - - - - - - - - - - -
---------------CTCTTTAAATTGAATCAT---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L K M S K S D P L E I S R I S L T D T D D Q I K
- K M S K S - - - - - - - - - - - - - - - - - -
---AGTTAACTCTGAATG------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L K I K K S K T D T I I G I T Y D P I N R P D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S N L L S I A S E T S G I P I T D L Q S E F K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K S N A I F K E F L S N S I I K N I S P I R E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I N Y Y Q S N P K L V R D I L L Q G S E K A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377
I A N K N L N I I K D I V G L Y H
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_trp_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E T D A T A E A A A V A Y E D I I T R F G A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P I T D D L L K R F E T V T G T K A H P M L R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G L F Y A H R D F E E F L S Y Y E K G H P I Y I
- - - - - - - - - - - - - - - - - - - - - - Y I
------------------------------------------------------------------TACATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y T G R G P S S G A L H L G H L L P F I F T K Y
Y T G R G P S S G . L H L G H L L P F I F T K Y
TATACGGGTCGCGGCCCTTCATCGGGG---CTGCACCTTGGACACCTTCTACCCTTCATTTTCACCAAGTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L Q D A F K C Y V V I Q I T D D E K F L R N R S
L Q D A - - - Y V V I Q I T D D E - - - - - - -
CTCCAGGATGCA---------TACGTAGTTATACAGATCACGGACGACGAA---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L S Y A E V D S Y T R E N I K D I I A C G F D P
- - - - - - D S Y T R E N I K D I I A C . . . .
------------------GATAGCTATACCAGGGAAAACATCAAGGACATTATTGCATGC------------
145146147148149150151152153154155156157158159160161162163164165166167168
D K T F I F I N S Q Y L S L K N R Y R F S C L V
. . T F I F I N S Q - - - - - - - - - - - - - -
------ACGTTTATTTTTATCAATTCGCAG------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D R M L P I S Q L R A S F G F S N D A N V G Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A F P P K Q M L P V Y S T Y F D G L P F T R V P
A F P P K Q M L P V Y - - - - - - - - - - - - -
GCGTTCCCCCCGAAACAGATGCTACCTGTATAC---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L P V G T G N E D A A D A V S T K K A S K K T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K K D A V L S P V H V V E E L F P D S K R Y Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A M C L I A S G I E Q D P Y F R L A R D L A P R
- - - L I A S G I E Q D P Y F R L A R D L A P R
---------CTTATCGCCTCCGGTATCGAGCAGGACCCTTACTTTCGATTGGCTCGCGACCTGGCCCCGCGT
289290291292293294295296297298299300301302303304305306307308309310311312
M G H P K N A Y L L G K F L P G L Q G S G T K M
M - - - - N A Y L L G - - - - - - - - - - - K M
ATG------------AATGCGTACTTGCTAGGG---------------------------------AAGATG
313314315316317318319320321322323324325326327328329330331332333334335336
S A S D P N S A I Y L T D T P A Q I K N K I N R
S A S - - - - - - - - - - - - - - - - - - - - -
AGCGCCTCG---------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y A F S G G R D T E E E H R A F G A D L S V D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S V R Y L E V F M K D D A E L E K L K A D Y K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G K L L T G E V K A T L I G I L Q G L I K E H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429
E R R D K V D T T M I E S F T V K K E L Q
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_trp_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T K N P I L F S A L C V V K G S I S T L F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S G K V S K L K F K N E K V S F N Y S L S K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I E M N D D T L E E L N N I I S Y K I K E N S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F Q V F K I L S K E A A S I Y G S E H L E S D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I P D D I E L R I V T L R N F Y L S A T R N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V L R N T K D I G N V L I E N I S L D H E N S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L V N F K V E N P L V R A S E E N F K D L C C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E Y S I Q D I K D G K F I V P S L E D S L P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S I N L D I I G D E L V N P W E V K A D N A Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I D Y N K L I D K F G C K L I T K D M I E R M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R L T G Q K A H H F F R R N I F L S H R D F E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I L D V Y E K G E L F Y L Y T G R G P S S E S L
- - - - - - - - - - - Y L Y T G R G P S S E . L
---------------------------------TATTTGTACACTGGAAGAGGTCCATCGTCTGAA---TTG
289290291292293294295296297298299300301302303304305306307308309310311312
H V G H L V P F L F T K Y L Q D T F K V P L V I
H V G H L V P F L F T K Y L Q D T - - - P L V I
CATGTAGGGCATCTAGTCCCATTCCTTTTTACTAAATATCTTCAAGACACA---------CCATTAGTAATC
313314315316317318319320321322323324325326327328329330331332333334335336
Q L T D D E K F I F K S N L T L E E T H N Y A Y
Q L T D D E - - - - - - - - - - - - - H N Y A Y
CAACTGACTGATGATGAA---------------------------------------CATAATTACGCATAT
337338339340341342343344345346347348349350351352353354355356357358359360
E N M K D I I A C G F D P E L T F I F T N L E Y
E N M K D I I A C . . . . . . T F I F T N L E -
GAGAATATGAAAGATATCATTGCATGT------------------ACTTTCATTTTCACAAATCTTGAG---
361362363364365366367368369370371372373374375376377378379380381382383384
I A E L Y P D I L R I E K K I S C S Q I K S I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G F K D S C N V G K F A F P A V Q A A P A F S S
- - - - - - - - - - - A F P A V Q A A P A F - -
---------------------------------GCTTTCCCAGCAGTTCAAGCTGCTCCAGCCTTT------
409410411412413414415416417418419420421422423424425426427428429430431432
S F P H I F G G R T D I H C L V P H A I D Q D P
- - - - - - - - - - - - - - L V P H A I D Q D P
------------------------------------------TTGGTGCCCCATGCGATTGATCAGGATCCA
433434435436437438439440441442443444445446447448449450451452453454455456
Y F R M V R D V A P R L G Y L K P S S I H S I F
Y F R M V R D V A P R L - - - - P S S I H S - -
TACTTTAGAATGGTCAGAGACGTTGCCCCAAGGCTT------------CCTTCATCAATCCACTCT------
457458459460461462463464465466467468469470471472473474475476477478479480
L P S L Q G S Q T K M S A S V Q N S S I F V N D
- - - - - - - - - K M S A S - - - - - - - - - -
---------------------------AAGATGAGTGCAAGT------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N E E S I R N K I M K Y A F S G G Q A T E E E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R R L G A N L D V D V S W Q Y L R F L M E D D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K L E E I G K K Y S S G E M L S G E I K S I L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q E L V K L T K N H Q K N R E A I N D D V I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593
F T N K S R E Q L L K L F I N K K
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_trp_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N R L R I L S G V Q P T G S L H I G N W L G A
- - - - R I L S G V Q P T G - L H I G N W L . A
------------CTTAAGAAAACCTAAAGCAGAACGCACCCT---TAGAGTTGTATCAGCTACTGA---AGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R N W V N L Q N T H E T Y V C V V D L H A I T
I R N W V N L Q N T - E T Y V C V V D L H - - -
TTTTTGGGCACCCTCTTTTAGAATATTATC---ATATGTACGATCATTTATTATTTCGTTATA---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M S Y D P I K L A E D T R N T A A L Y L A C G I
- - - - - - - - A E D T R N T A A L Y L A C . .
------------------------AGCATCTATGAGTAATTGTTTAAAATTACCCCAACCCATTTC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N P E H S T V F V Q S H V R A H S E L C W L L N
. . . . S T V F V Q S H - - - - - - - - - - - -
------------TGTTTCACGTCCCTTTCCAGATAA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C L T P L N W L E R M I Q F K E K S I K Q G S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V S I G L L D Y P I M M A A D I L L Y D A D L V
- - - - - - D Y P I M M A A D I L - - - - - L V
------------------ATTAATACGACTATTATCATCAGGATGACTCTT---------------ACCATC
145146147148149150151152153154155156157158159160161162163164165166167168
P V G E D Q K Q H L E L A R D I A Q Q R V N S R
P V G E D Q K Q H L E L A R D I A Q Q R - - - -
TACAAGACTCATAATCCTTGCCCCTTCTGACATAATTAGAGGCTCAGGGACTTTGACTAT------------
169170171172173174175176177178179180181182183184185186187188189190191192
F G K D E N V I V K V P E P L I M S E G A R I M
- - - - - - - - - - - P E P L I M - - - - - - -
---------------------------------TATATCTCTCGCTAATTC---------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S L V D G R S K M S K S H P D D N S R I N L L D
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------ATCATAAAGCAGGAT------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S P D L I K K K I K R A K T D S N I G L E F T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T D R P E A D N L L G I Y A I L S G K G R E T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A I E C S E M G W G N F K Q L L I D A T I E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K P I Q N H Y N E I I N D R T Y M D N I L K E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A Q K A N S V A D T T L Q R V R S A L G F L K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338
I G
- -
------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_trp_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_trp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E D E T I Q N I T P W E A Q V V T D N K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S I N Y E K I I T Q F G C K E Y H E E L T K K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q E M T G V P P H F Y F L R N I V F A H R D F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I L L E K L K S K S F Y L Y T G R G P S S K S M
- - - - - - - - - - - Y L Y T G R G P S S K . M
---------------------------------TTCTTTTCCGCCACTAAAAGCATATTTTCGTAT---TTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H L G H V I P F Q L C K Y F Q D T F N C P L V I
H L G H V I P F Q L C K Y F Q D T - - - P L V I
AGCAATTTGAGCCGGTGTGTCGGTTAAAAAAATTGAACTTGTAGTATCACT---------CTTCCTATTAAC
121122123124125126127128129130131132133134135136137138139140141142143144
Q M T D D E K F L F K D Q S F E E S T K Y C A E
Q M T D D E - - - - - - - - - - - - T K Y C A E
TCCTTTTAAATCGGGCAA------------------------------------CATTACGCTAGCTTTGTC
145146147148149150151152153154155156157158159160161162163164165166167168
N I K D I I A F G F N P K L T Y I F S N V E S S
N I K D I I A F . . . . . . T Y I F S N V E - -
TCTAGCTAATCTAAAATAAGGATC------------------TATAAGACACATAGCGCCTTTGTT------
169170171172173174175176177178179180181182183184185186187188189190191192
H L F E K N T L K I A K S I S L N E A C K I F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F D N N S N I G M I G F P A K E I A P C F A S S
- - - - - - - - - - G F P A K E I A P C F - - -
------------------------------TAGCGAAATTGATTTAGCAATTTTTAATGTATT---------
217218219220221222223224225226227228229230231232233234235236237238239240
F E F L N K G A M C L I P C A V D Q D P Y F R L
- - - - - - - - - - L I P C A V D Q D P Y F R L
------------------------------ATATGTTAACTTTGGATTAAAACCAAATGCTATGATGTCCTT
241242243244245246247248249250251252253254255256257258259260261262263264
A R D K A S V M K E P K P T T L Y V S L L P D L
A R D K A S V M - - - - P T T L Y V - - - - - -
AATATTTTCTGCGCAGTATTTAGT------------TGACTGATCTTTAAATAA------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G V N R K M S A S D T T S S I F L T D T P A Q
- - - - - K M S A S - - - - - - - - - - - - - -
---------------AGGACAATTAAATGT------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I A K K I R K Y A F S G G K E T L E E H K R L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G D T A V D I S Y Q Y L R Y F Y D D N I D L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I K N A Y E K G E M S T G D I K N K C I D V L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K F V K D Y Q E R R N S I T E E L F Q E F C S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385
L
-
---
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_tyr_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T P E E R L K L I T R N T V E I V T L E E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S K I E A G E K L K G Y L G F E P S G L F H I G
- - - - - - - - - K G Y L G F E P S G L F H I G
---------------------------AAAGGCTATCTAGGGTTTGAGCCTAGTGGCCTCTTCCACATAGGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W L V W A N K V K D L V D A G I E F Y L L A A T
W L V W A N K V K D L V D A - - E F Y L L A A T
TGGCTTGTCTGGGCTAATAAGGTCAAAGATCTAGTAGATGCC------GAGTTCTATCTGCTAGCTGCTACG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W H A W I N D K L G G D M E L I R K A A R H V V
W H . . . . . . . . . . . . . . . K A A R H V V
TGGCAC---------------------------------------------AAAGCTGCACGGCATGTAGTA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D V L E A I G V D K A K L K V V D A E D L V S D
D V L E A I . . . . . . L K V V D A E D - - - -
GATGTGCTAGAGGCTATA------------------CTAAAGGTTGTTGATGCAGAGGAT------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E Y W A I L L R V A K N N T L A R I K R A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I M G R R A E E A E L D F S K L I Y P A M Q V T
- - - - - - - - - - - - - - - - I Y P A M Q V T
------------------------------------------------ATATACCCGGCGATGCAAGTCACG
169170171172173174175176177178179180181182183184185186187188189190191192
D I F Y L D L D I A L G G L D Q R K A H M L A R
D I F - - - - - I A L G G L D Q R K A H M L A R
GACATATTC---------------ATAGCTCTAGGTGGGCTTGATCAACGCAAGGCACACATGCTGGCCAGA
193194195196197198199200201202203204205206207208209210211212213214215216
D T A E K L G R K K P I A I H T P L L T G L Q G
D T A E K L - - - - P I A I H T - - - - - - - -
GATACTGCGGAGAAGCTT------------CCTATAGCTATTCATACA------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I G R M N P S M V D E E Q H A V E F K M S K S K
- - - - - - - - - - - - - - - - - - K M S K S -
------------------------------------------------------AAGATGAGTAAGTCT---
241242243244245246247248249250251252253254255256257258259260261262263264
P E T A V F V Y D S P E D I E K K I L R A Y C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A R E V K F N P I M E I N K Y L L F A R P G F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L V I E R P E K Y G G T I I V E S Y E E L E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y I E G R L H P L D L K K A T A K A L I E M L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P V R R Y F E Q N R E A R E T L E E L K K A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362
T R
- -
------
Class I
Archaea/Thermoplasma volcanium/amino acid sequences/Tyr_Arc_T_volcanium_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L I D K L M K N T R E I V T L E D A Q K L D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A G V K S Y I G I E P S G I P H V A T A V M W
- - - - K S Y I G I E P S G I P H V A T . V M W
------------TTTGAGCTCAGTTGGTGCAATTTTGCCGGATATATAGTCATTCTGGAA---ATCAACATT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P R K L A E L Q D D I K I Y V L L A D W H A M I
P R K L A E L Q D - - K I Y V L L A D W - - - -
TTCTATTCGAACATTTCCAGATGGTTT------GATTATATCTCTTCCATAGTACGGGAT------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N N K L H G D L D L I R K G G E L L K R S F M A
- - - - H . . . . . . . K G G E L L K R S F M A
------------AAG---------------------GGGTGGGCAGAAAGCAGCATTGACTTTTCTTTCAAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E G L T K A E Y L W A S Q L V S S S N Y W E M F
E . . . . A E Y L W A S Q - - - - - - - - - - -
GTC------------ATTTATGAGAATGGCCGAGTTCGG---------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I K T A K R S T L K R L T R A L P I M G R T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D A E K D F S M Y I Y P I M Q V T D I F Y L D V
- - - - - - - - - I Y P I M Q V T D I F - - - -
---------------------------ATGTCGCTGATCCATCCCTCCAAATGCAATATC------------
169170171172173174175176177178179180181182183184185186187188189190191192
D I A F G G M D Q R H A H M L A R D I A D K M K
- I A F G G M D Q R H A H M L A R D I A D K M -
---TATGTCGGTAACCTGCATTATAGGGTAAATGTACATACTAAAGTCTTTTTCTGCATCGGCCTCAGT---
193194195196197198199200201202203204205206207208209210211212213214215216
V K K A V S V H G Y L L S S L K G N T R M D N F
- - - A V S V H G - - - - - - - - - - - - - - -
---------CGGAAGGGCTCTTGTGAG---------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V K M S K S D P N S A I L I N D E Y K D I E R K
- K M S K S - - - - - - - - - - - - - - - - - -
---ATTCGAAGAAGAAAC------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V N A A F C P P E K V D G N P L A E I M K Y V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I P Y Y G R D I I I E K P S G N V R I E N V D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F Q N D Y I S G K I A P T E L K K A M I P I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331
E M I E P A R K V A Y D M D L S I F S
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_tyr_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D V E E R L K L V T R N A V E V V T E E E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q L L E E K E E P V A Y V G F E P S G K V H L G
- - - - - - - - - V A Y V G F E P S G K V H L G
---------------------------GACGAAGTCCCGCTCCAGCTCTTCGTAACTGGTGTAGGTGACATC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H K L V I D K M I D L Q E A G F H V I I L L A D
H K L V I D K M I D L Q E A - - H V I I L L A D
GCCACCGTATTTCTCCGGACGTTCGATCGTGACCTCATCGTA------GAATATGAAGTACCGATAGATCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L H A Y L N E K G T L E E V R E L A D Y N R R C
L H . . . . . . . . . . . . . E L A D Y N R R C
GAGGAT---------------------------------------TCGAAGCTTTTCCCGGATGACCTCCGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F L A M G L D P N K T E F V L G S E F Q L D E D
F L A M . . . . . . T E F V L G S E - - - - - -
CTCGTCGTCGAC------------------GCTGGAAGACATCTTCTCGTCTCC------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y A L D V Y R M A R H T T M R R A R R S M D M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A R S E E N P P V S Q V V Y P L M Q A L D I V H
- - - - - - - - - - - - V Y P L M Q A L D I V -
------------------------------------TAGGTGCACGATGTCCAGTGCCTGCATAAGAGG---
169170171172173174175176177178179180181182183184185186187188189190191192
L N V D L A V G G L E Q R K I H M L A R D V L P
- - - - L A V G G L E Q R K I H M L A R D V L P
------------TACCGGAGGGTTTTCCTCGCTCCTAGCGATCATATCCATGCTGCGTCGGGCTCGGCGCAT
193194195196197198199200201202203204205206207208209210211212213214215216
K L G Y D S P T C L H T P I I H G L D G D E K M
K L - - - - P T C L H T - - - - - - - - - - K M
GGTAGT------------CCGGTACACGTCCAGCGC------------------------------GAGGAC
217218219220221222223224225226227228229230231232233234235236237238239240
S S S K N N F I A V D D E P E V I R E K L R K A
S . . . . . . . . . . . . . . . . . . . . . . .
GAA---------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y C P A R E A E G N P I L E I Y R Y F I F R E Y
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D E V T I E R P E K Y G G D V T Y T S Y E E L E
. . . . . . . . . K . . . . . . . . S - - - - -
---------------------------GAC------------------------ACC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
R D F V D G E L H P L D L K E N A A G Y L S E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324
L K P V R K A V S A P S
- - - - - - - - - - - -
------------------------------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_tyr_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D T Y A R V I R N T V E V V T D E E L R S L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D R P V R K V Y A G Y E P S G E I H L G H L V T
- - - - - K V Y A G Y E P S G E I H L G H L V T
---------------AAGGTCTACGCAGGATATGAGCCAAGTGGAGAGATCCATCTTGGACACCTGGTTACT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I N K L I D L R D A G F E V T V L L A D L H A F
I N K L I D L R D A - - E V T V L L A D L H . .
ATCAATAAACTGATAGACCTGAGAGATGCA------GAAGTCACTGTTCTCCTTGCCGATCTCCAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L N R K G T M E E V K K L A E Y N R R C F E G L
. . . . . . . . . . . K L A E Y N R R C F E G L
---------------------------------AAACTTGCAGAATATAACCGCCGCTGTTTTGAAGGGCTG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G L T D I K Y V L G S S F Q L S P E Y Q I L V H
. . . . I K Y V L G S S - - - - - - - - - - - -
------------ATCAAATATGTGCTCGGGTCCAGT------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L S Q A I T L N R A K R S M D E V G R Q M D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P T V S Q M V Y P I M Q M A D I A M L G V D A A
- - - - - - V Y P I M Q M A D I A - - - - - A A
------------------GTATACCCCATTATGCAGATGGCTGATATTGCC---------------GCTGCA
169170171172173174175176177178179180181182183184185186187188189190191192
L G G I D Q R K I H M L A R E Y L P S K N Y P S
L G G I D Q R K I H M L A R E Y L P S K - - - -
CTTGGCGGAATTGATCAGCGGAAGATCCATATGCTGGCTCGTGAGTATCTGCCATCGAAA------------
193194195196197198199200201202203204205206207208209210211212213214215216
P V C I H V P I L Q G L D G K K M S S S Q G N Y
P V C I H V - - - - - - - - - K M S S S - - - -
CCGGTCTGTATTCATGTC---------------------------AAGATGTCCTCTTCC------------
217218219220221222223224225226227228229230231232233234235236237238239240
I S V A E S E E D I R K K M K K A F C P P E V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D N P V L Q V L Q H H I F P R L D T V T I E R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E K F G G N R T F G S Y E E M E Q A Y A K G E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H P A D L K T A V A E S L I T I L A P V R E Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313
K
-
---
Class I
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_tyr_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D D S L K T I T R D V L E V I T P E E L M D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K K D E P V V Y T G Y E P S G R I H L G H A L
- - - - - - V V Y T G Y E P S G R I H L G H A L
------------------GCTACTGGAGTACATCTCAAGCAGCTCATCGAGTTCCAGTTCCAGGTCGCCCCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T V R K L R E L Q D A G F R V K I L L A D Y H A
T V R K L R E L Q D A - - R V K I L L A D Y H .
GAATTTCTCAGGTCTCCTTATGGTCATCATTCC------TGGCATTATGAAGTACTTCACGATTTCGAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y L N G K G S M E R I R E L A D Y N Q K C F L A
. . . . . . . . . . . . E L A D Y N Q K C F L A
------------------------------------CTTCTTAACCTTCTCCCTTATTTCATCGGGGGAATC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L G L S P E R T E F I L G S S F Q T E P E Y T D
L . . . . . . T E F I L G S S - - - - - - - - -
ATC------------------CTTACTTGATGACATCTTTTCAGA---------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L V Y R L A L I T T L L R A K R S M A Q I T R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S R D H K V A E V I Y P L M Q V I D M V Y L G V
- - - - - - - - - I Y P L M Q V I D M V - - - -
---------------------------GCCCAGGTAAACCATGTCTATGACCTGCATTAA------------
169170171172173174175176177178179180181182183184185186187188189190191192
D V A L G G M E Q R K I H M L A R E N L P R L G
- V A L G G M E Q R K I H M L A R E N L P R L -
---TGCAACCTTATGGTCCCTGGATTCCCTGGTTATCTGGGCCATACTCCTTTTTGCTCGCAGGAGGGT---
193194195196197198199200201202203204205206207208209210211212213214215216
F D A P V C I H T P L L H G T D G S E K M S S S
- - - P V C I H T - - - - - - - - - - K M S S S
---------CAGTCTGTAGACCAGGTC------------------------------TCCCAGTATGAACTC
217218219220221222223224225226227228229230231232233234235236237238239240
K G N F I A V D D S P D E I R E K V K K S Y C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
M G E T E G N P I I E I V K Y F I M P E Y G M M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T I R R P E K F G G D L E L E L D E L L E M Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S S E L H P L D L K N A V S D Y L V D M L E P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319
R E Y M E G V
- - - - - - -
---------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_tyr_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H L I E K I Y K N T R E V V T R E D A E R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G K S D I K S Y I G I E P S G I P H I A T A V M
- - - - - K S Y I G I E P S G I P H I A T . V M
---------------GAGATCTGCCGGTTGAATCTCTCCCCTTTGGTAAGCCTGATCGAAGTT---TACGCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W P R K L A E I Q D D I K V T V L L A D W H A M
W P R K L A E I Q D - - K V T V L L A D W - - -
GTCGAGATTTATTACGCCATTGGATCCGTG------AATACTCTTTCCGTAATAAGGTATTAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I N N K L H G D L D L I R K G G E I L R K T F Q
- - - - - H . . . . . . . K G G E I L R K T F Q
---------------AGG---------------------CGGGCAGTAAGCTGCATTTATCTTCCTTTCGAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E G L T K A D Y V W A S D L V D S S E Y W R M
A E . . . . A D Y V W A S D - - - - - - - - - -
ATCTTC------------CACCAGTATTGCTGAATTCGGATC------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F I D T A K R S T L K R V I R S L P I M G R N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T D A E K D F S M Y L Y P I M Q V T D I F Y L D
- - - - - - - - - - L Y P I M Q V T D I F - - -
------------------------------CCTCTGATCCATTCCGCCGAATGCCATGTCCAC---------
169170171172173174175176177178179180181182183184185186187188189190191192
V D M A F G G M D Q R H A H M L A R D I A E K M
- - M A F G G M D Q R H A H M L A R D I A E K M
------GTCGGTGACCTGCATTATCGGATAGAGATACATGCTGAAGTCCTTCTCGGCGTCGGTCTCATTCCT
193194195196197198199200201202203204205206207208209210211212213214215216
K R K K V V S V H G F L L S S L K G N A R M D N
- - - - V V S V H G - - - - - - - - - - - - - -
------------AAGTGATCTTATCACACG------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F V K M S K S D P N S A I L V T D H M E D I E R
- - K M S K S - - - - - - - - - - - - - - - - -
------GGAAGAGTCTACAAG---------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I N A A Y C P P Q Q V E G N P V A E I M K Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I I P Y Y G K S I E I H G S N G V I N L D S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N F D Q A Y Q R G E I Q P A D L K H K V A T I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332
N E M V E P A R R S L E G L D L S E F Q
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_tyr_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E T K L E N I L K N T S E V V S E E E L K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L N E I S K G N D K I A Y I G F E P S G R I H L
- - - - - - - - - - I A Y I G F E P S G R I H L
------------------------------ATAGCCTATATCGGATTTGAGCCAAGTGGAAGAATACATTTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H Y L Q I K K M I D L Q N A G F K I I I L L A
G H Y L Q I K K M I D L Q N A - - K I I I L L A
GGGCACTACCTCCAAATAAAAAAAATGATAGATTTGCAAAATGCA------AAAATTATTATTCTTCTTGCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D L H A Y L N Q K G T M E E I K E L A E Q N K K
D L H . . . . . . . . . . . . . E L A E Q N K K
GACCTCCAT---------------------------------------GAATTGGCAGAACAGAACAAAAAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V F D A I G L N A T Y I Y G S E F Q L K P E Y N
V F D A I . . . A T Y I Y G S E - - - - - - - -
GTATTTGATGCCATA---------GCCACATATATATATGGAAGCGAA------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D L Y K V A V N T T L K R A R R S M E V I A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E D D N P K V A G V V Y P L M Q V I D I K H L N
- - - - - - - - - - V Y P L M Q V I D I K - - -
------------------------------GTTTATCCACTTATGCAGGTAATAGATATTAAA---------
169170171172173174175176177178179180181182183184185186187188189190191192
A D V A V G G M E Q R K I H M L A R E I L P S M
- - V A V G G M E Q R K I H M L A R E I L P S M
------GTGGCCGTTGGAGGAATGGAACAGAGAAAAATACACATGCTTGCAAGGGAAATTTTACCATCTATG
193194195196197198199200201202203204205206207208209210211212213214215216
D Y K A P V C I H N P V L T G L D G E G K M S S
- - - - P V C I H N - - - - - - - - - - K M S S
------------CCAGTTTGCATACATAAC------------------------------AAAATGTCCTCC
217218219220221222223224225226227228229230231232233234235236237238239240
S K G N F I A V D D D D A T I K S K I K K A Y C
S - - - - - - - - - - - - - - - - - - - - - - -
TCA---------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P I G E V E G N P I L E I A K Y Y L N Y P I T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E R P E K F G G N L I I N S Y N G L E E L Y K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D L H P M D L K N A V V K G I I E M L T L I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317
G P N S E
- - - - -
---------------
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_tyr_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I E E R I N L I A Q K P T E E I L T I D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K Q Y L E Q G I D L N H Y I G F E I S G F V H L
- - - - - - - - - - N H Y I G F E I S G F V H L
------------------------------TGCTACATACTCTTTTAAATCTAATGGATGTATTTGCTTTTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G T G I I S M L K V R D F Q K A K V K T T L F L
G T . I I S M L K V R D F Q K A - - K T T L F L
AGCATA---TTCTTTTAATTGTTCGACATTATCAAATTCCATTGTTTG------TTTTTTGTTTTCTATTAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A D Y H S W I N K K L G G D L E T I R K V A K G
A D Y H . . . . . . . . . . . . . . . K V A K .
TATGGGCTCTTT---------------------------------------------TAGCTCTATTTC---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y F A E A L K V S L K T V G G D P D E V K V V L
Y F A E A L K V S . . . V - - - - - - - K V V L
TATGGGGCAATAAGCCTTTCTAATTTT---------ATC---------------------TATTGCAGTCTC
121122123124125126127128129130131132133134135136137138139140141142143144
G S E L Y E K L G I E Y L E N I I K I S M N T T
G S E - - - - - - - - - - - - - - - - - - - - -
GGGTTTAGA---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L N R I K K G I T I M G R K Q G E S I S F A Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L Y V P M Q V A D I Y S L N V N L A H G G I D Q
L Y V P M Q V A D I Y - - - - - L A H G G I D Q
CTTATAACCAAAAGCATCTGAAACCTCTATGGC---------------CCTTTGGTCTATTCCCCCATGGGC
193194195196197198199200201202203204205206207208209210211212213214215216
R K A H V I A I E V S D A F G Y K P I A V H H H
R K A H V I A I E V S D A F - - - P I A V H H -
TAAATTAACATTTAAGCTATATATATCTGCAACTTGCATAGG---------TAATTGGGCGAAACTTAT---
217218219220221222223224225226227228229230231232233234235236237238239240
L L L G M H I D E N I R Q K L L E A K K T N N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E L F E D S V I D I K M S K S K P E T A I F I H
- - - - - - - - - - K M S K S - - - - - - - - -
------------------------------TTTCTCATACAATTC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D T P E D I R R K I R K A Y C P I G E I E L N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I I E L V E Y V I Y P I L K E P I V I E N K K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Q T M E F D N V E Q L K E A Y A K K Q I H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D L K E Y V A E K L I E I L E P A R K Y F L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376
K G N K Y L E E L K N L Q I T R
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_tyr_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I D E K I K L I T R N T D E V I T V D E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K K L E E N S K L K G Y I G F E P S G L F H I G
- - - - - - - - - K G Y I G F E P S G L F H I G
---------------------------TCTTGCCGTAGCTAGCTTTAAGTCTAACGGATGCAATTTACCTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W L I W A Q K L K D L I K A G V D M S I L V A T
W L I W A Q K L K D L I K A - - D M S I L V A T
AATGAAAATGCGTTCTAGTTCTTCGTATGATTTTATCTCTAT------ACCATACTTGGCATCTCTCTCTAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W H A M I N D K L G G D L E K I K L A G K Y A L
W H . . . . . . . . . . . . . . . L A G K Y A L
TTTCAA---------------------------------------------AACAGGGTTATCGTTTACTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E V L E G F G V D M S K L K V V Y A E D L V E N
E V L E G F . . . . . . L K V V Y A E D - - - -
TCCCTTTGGACAATATGA------------------AACTAATTCTGGTGAGTCATGAAT------------
121122123124125126127128129130131132133134135136137138139140141142143144
I D Y W S L V V K V A K N T S L A R M K R A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I M G R R S E E A E L D T S K L I Y P A M Q V S
- - - - - - - - - - - - - - - - I Y P A M Q V S
------------------------------------------------TTTTTTCCTTTGTAATTTTTCTGC
169170171172173174175176177178179180181182183184185186187188189190191192
D I F F Q D L D I A L G G T D Q R K A H M L A R
D I F - - - - - I A L G G T D Q R K A H M L A R
CACGTCTCT---------------TTTTCTCTGATCTGTACCACCTAAAGCTATGTCAAGATCCTGGAAGAA
193194195196197198199200201202203204205206207208209210211212213214215216
D V A E K L Q R K K V I A I H T P L L V G L Q G
D V A E K L - - - - V I A I H T - - - - - - - -
TATGTCGGAAACTTGCAT------------TAATTTTGAGGTATCAAG------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G Q R M N T E G L E E D D Y L A T I K M S K S K
- - - - - - - - - - - - - - - - - - K M S K S -
------------------------------------------------------TACCACTAAGCTCCA---
241242243244245246247248249250251252253254255256257258259260261262263264
P E T A I F I H D S P E L V E S K L K N S Y C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G V V N D N P V L Q I N K Y I I F G E Q G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L K I E R D A K Y G G D I E I K S Y E E L E R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F I E G K L H P L D L K L A T A R K L N D I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P I R K R I S S K S Q F V D L I S S I E K S I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361
R
-
---
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_tyr_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D R L E L I R R N V Q E I V T E E E L E G L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K N K E A P R A Y V G Y E P S G K I H M G H V L
- - - - - - R A Y V G Y E P S G K I H M G H V L
------------------TATAAAGTTGCTCTCCATCTCAGCATAGCTGTGGTATGTGATGTCTCCCCCGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T V N K L I D L Q K A G F K I T V L L A D V H A
T V N K L I D L Q K A - - K I T V L L A D V H .
TTTTTCCGGCCTTTCAATGACAACTGTCTCGTA------GAAGATGTGGTAGCGGAAAAGAGCAAGGAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y L N K K G T L E E V R K I A D Y N R R C F I A
. . . . . . . . . . . . K I A D Y N R R C F I A
------------------------------------CTTAAACTTCCTGTAGATATCTTCTCCCGTATCGTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L G L D E E Q T D F V Y G S D F Q L G A E Y M L
L . . . . . . T D F V Y G S D - - - - - - - - -
TAT------------------TGAAGAAGCCATCTTTGTTCCGTC---------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V L K L S R A V T L N R A K R S M D E V G R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M D D P T V S Q M V Y P L M Q A I D I A L L E V
- - - - - - - - - V Y P L M Q A I D I A - - - -
---------------------------CAGGGCAATGTCAATAGCCTGCATCAGGGGATA------------
169170171172173174175176177178179180181182183184185186187188189190191192
D V A V G G I D Q R K I H M L A R E N L K S L G
- V A V G G I D Q R K I H M L A R E N L K S L -
---GGTGGGGTCGTCCATTGCGCGTCCTACTTCGTCCATGCTTCTCTTTGCCCTGTTGAGGGTGACTGC---
193194195196197198199200201202203204205206207208209210211212213214215216
F E T P I C I H T P I L L G L D G T K M A S S K
- - - P I C I H T - - - - - - - - - K M A S S -
---------GAGCACGTTTAACATGTA---------------------------GTATACGAAATCGGT---
217218219220221222223224225226227228229230231232233234235236237238239240
D N F I S I D D T G E D I Y R K F K K A F C K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G D V E E N P I L A L F R Y H I F P R Y E T V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I E R P E K F G G D I T Y H S Y A E M E S N F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E E K V H P M D L K N A A A K Y I N E I L D P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317
R K V L L
- - - - -
---------------
Class I
Archaea/Staphylothermus marinus/Smarinus_tyr_aa
Archaea/Staphylothermus marinus/Smarinus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D V N D K I K L A S R N T V E V I T L E D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K V F E E K E H P R G Y I G F E P S G L V H V G
- - - - - - - - - R G Y I G F E P S G L V H V G
---------------------------TGCTTCAGCTGTAGCGTTTTTTAGGTCTAGCGGATGTATTTTTCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W L V W M N K V R D L L E A G V D F Y I L E A T
W L V W M N K V R D L L E A - - D F Y I L E A T
CTCAACATATAGTTTCTCTAGTTCATCGTATGATTCAATAGT------TCCACCATATTTTTCCGGACGATC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W H A Y I N D K L G G D M D L I R K A A R L V R
W H . . . . . . . . . . . . . . . K A A R L V R
TATGTA---------------------------------------------TATTATCGGGTTAAACATTGT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K V M E G F G I D V S K I K F V D A E E L V S D
K V M E G F . I - - - - - K F V D A E E - - - -
TTCGCGTGGAGGACAATA---TTT---------------TATTTCTTCCGGTGGATCATG------------
121122123124125126127128129130131132133134135136137138139140141142143144
K D Y W G I L V R S A K N V S L A R V K R A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I M G R K S E E A E T D F S K L I Y P L M Q V S
- - - - - - - - - - - - - - - - I Y P L M Q V S
------------------------------------------------AGGTTTTTTTCTACCTATTTTCTC
169170171172173174175176177178179180181182183184185186187188189190191192
D I F Y L D L D I A L G G T D Q R K A H M L A R
D I F - - - - - I A L G G T D Q R K A H M L A R
AGCAATATC---------------GGCTTTTCTCTGATCAGTTCCTCCCAACGCAATATCTAGGTCTAAATA
193194195196197198199200201202203204205206207208209210211212213214215216
D I A E K I G R K K P V A I H T P I I T G L K G
D I A E K I - - - - P V A I H T - - - - - - - -
GAATATGTCACTGACTTG------------TATTAGTTTTGAAAAATC------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P G R R M D I V G E I D E V Y A T H K M S K S K
- - - - - - - - - - - - - - - - - - K M S K S -
------------------------------------------------------ACGGACAAGTATTCC---
241242243244245246247248249250251252253254255256257258259260261262263264
P E T A I F V H D P P E E I R A K I R K A Y C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P R E T M F N P I I E I N K Y L L F A T P G F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L Y I D R P E K Y G G P I T I E S Y D E L E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y V E G K I H P L D L K N A T A E A L N K L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P I R K K L R T D P E A R E I L E T L L K T K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362
T R
- -
------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_tyr_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D T H E L V T R N A A E V V T E E E V E A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D D P E G K R A Y V G Y E P S G V L H L G H L L
- - - - - - R A Y V G Y E P S G V L H L G H L L
------------------CGGGCGTACGTCGGCTACGAGCCCTCCGGCGTCCTCCACCTCGGCCACCTGCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T A N K L I D L Q D A G I E V V V L L A D V H A
T A N K L I D L Q D A - - E V V V L L A D V H .
ACCGCGAACAAGCTCATCGACCTGCAGGACGCC------GAGGTCGTCGTGCTGCTGGCGGACGTCCAC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y L N D K G T F E E I R E T A E Q M K A Q F L A
. . . . . . . . . . . . E T A E Q M K A Q F L A
------------------------------------GAGACGGCCGAGCAGATGAAGGCCCAGTTCCTCGCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y G L D E E Q T E F V L G S D Y Q L D E D Y E L
Y . . . . . . T E F V L G S D - - - - - - - - -
TAC------------------ACGGAGTTCGTCCTCGGCAGCGAC---------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D L H A L Q V E T S L K R A Q R A M A E I Q S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E T A K V S H V V Y P L M Q A L D I E Y L D V D
- - - - - - - - V Y P L M Q A L D I E - - - - -
------------------------GTCTACCCGCTGATGCAGGCCCTCGACATCGAG---------------
169170171172173174175176177178179180181182183184185186187188189190191192
L A I G G L D Q R K V H M L A R E E L P S L G Y
L A I G G L D Q R K V H M L A R E E L P S L - -
CTCGCCATCGGCGGCCTCGACCAGCGGAAGGTCCACATGCTCGCCCGCGAGGAACTCCCGAGCCTC------
193194195196197198199200201202203204205206207208209210211212213214215216
E K R P A L H T P I I G D L T T G E G K M S S S
- - R P A L H T - - - - - - - - - - - K M S S S
------CGGCCCGCGCTCCACACG---------------------------------AAGATGAGCTCCAGC
217218219220221222223224225226227228229230231232233234235236237238239240
E G V S I S M E D S T E E L A E K V N S A F C P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P E R D P E G D L V N P V L E L F Q Y H V F P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F E T V V V E R P D E Y G G D L S Y D D Y E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A D D L E S G E L H P A D A K G A L A D Y L D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326
L V A P G R Q R L R E L R D
- - - - - - - - - - - - - -
------------------------------------------
Class I
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_tyr_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L S E L L S R G V A E V I V E S E L R A R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q S G T P L R L K Q G F D P T K P D M H I G H A
- - - - - - R L K Q G F D P T . P D M H I G H A
------------------CGCCTGAAACAAGGGTTTGATCCGACA---CCCGACATGCATATCGGGCACGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V G L R K L R A F Q E L G H Q V V L I V G D W T
V G L R K L R A F Q E L - - Q V V L I V G D W -
GTAGGGCTGCGTAAGCTACGCGCCTTCCAAGAACTG------CAGGTGGTGTTGATCGTCGGTGACTGG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A Q I G D P S G R D E T R A R L S A A E V R A N
- - - - - - - - - - - - - - - - - - - - - R A N
---------------------------------------------------------------CGCGCCAAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E T Y M E Q F F R V V D R Q R T E V R W Q S E
A E T Y M E Q F F R V . . . . . T E V R W Q S E
GCCGAGACCTACATGGAGCAATTTTTCCGGGTG---------------ACCGAGGTACGCTGGCAGAGTGAA
121122123124125126127128129130131132133134135136137138139140141142143144
W F G Q F T L E N A L D L A G R F T L A Q M L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H E T F R K R Y E T G A P L T I L E L M Y P M L
- - - - - - - - - - - - - - - - - - - M Y P M L
---------------------------------------------------------ATGTATCCGATGCTG
169170171172173174175176177178179180181182183184185186187188189190191192
Q A Y D S V A I R A D V E F G G T D Q K F N I L
Q A Y D S V - - - - - V E F G G T D Q K F N I L
CAAGCGTATGACTCGGTC---------------GTTGAGTTTGGTGGTACGGACCAGAAGTTTAATATTCTC
193194195196197198199200201202203204205206207208209210211212213214215216
A G R E L M A Q L G M T P Q Q V F L V P L I P G
A G R E L M A Q L - - - - Q Q V F L V - - - - -
GCCGGACGAGAGCTGATGGCGCAGTTG------------CAGCAAGTCTTCCTGGTA---------------
217218219220221222223224225226227228229230231232233234235236237238239240
T D G R K M S K T F N N T V D I R M P P T E M Y
- - - - K M S K T - - - - - - - - - - - - - - -
------------AAGATGTCGAAGACG---------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G R I M S M S D E V L P L Y F E V L T D V P M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I A E M K T A M A T G Q V N P R D L K M R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R E I V A Q F H D P A A A A A A E A T F I R Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V E R E L P E D I P N F T L E A P T G I V D V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V A S G L A P S K S E A R R L I D G G G V R V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G E R V E G Y T L T I N P G A N V V V Q V G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390
K F V R V V
- - - - - -
------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_tyr_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I K K I L A E V K R G C A E L I D E E R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N L I K N Y Y E K G E N F F I K A G F D P T A P
- - - - - - - - - - - - - F I K A G F D P T . P
---------------------------------------TGCATTAGCACTGATGCTTCTTCTTGC---AGA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D L H L G H S V V L T K M A F L Q K H G A I V Q
D L H L G H S V V L T K M A F L Q K H - - I V Q
AGTAGAACTTTCCAAACCACATTCAACCAAAGCCTTAGCAAGCCAAATTTTTCCTTG------AAACTCAGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F L I G D F T G Q I G D P S G K S A T R K K L D
F L I G D F - - - - - - - - - - - - - - - - - -
CATATCACTTGGCAAAGC------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K E Q V L I N A K T Y K T Q V F K V L D K E K T
- - - - L I N A K T Y K T Q V F K V . . . . . T
------------CTCTGTAATCTCTAAAGCTAAATTTTCTTTAGCTTTTTTAGG---------------TTC
121122123124125126127128129130131132133134135136137138139140141142143144
Q I K F N S T W L N E L G A A G I V E L T S T F
Q I K F N S T - - - - - - - - - - - - - - - - -
TATATCTTTTTTTATTTGCGC---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S V A R M L E R D D F T K R F K E Q S P I S I C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E F L Y P L L Q G Y D S V A L K S D I E M G G T
- - L Y P L L Q G Y D S V - - - - - I E M G G T
------ACTCATTTTGTTTACACCGTCTAAACCTTCGAG---------------CACAGCTTGTTCTTTTCC
193194195196197198199200201202203204205206207208209210211212213214215216
D Q K F N L L M G R Q L Q R V Y N I G K E Q A V
D Q K F N L L M G R Q L Q R V Y - - - - - Q A V
TATGTTATAAACTCTTTGAAGCTGTCTTCCCATCAAAAGATTAAATTT---------------CATTTCAAT
217218219220221222223224225226227228229230231232233234235236237238239240
I M M P L L E G L D G V N K M S K S L N N Y I G
I M M - - - - - - - - - - K M S K S - - - - - -
ATCGCTTTT------------------------------AGGATACAAAAACTC------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V T E K A N D M Y A K I L S I S D E L M F R Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L L S Q K S L E E I A Q I K K D I E Q G N L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P K K A K E N L A L E I T E R F H S K E E A N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A K S E F D R I H S Q N A L P S D M A E F E I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G K I W L A K A L V E C G L E S S T S A A R R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I S A N A V S V N S Q K V S D E Q M Y L E Q G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401
Y I L Q I G K R K F A K L K V K E
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_tyr_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E D T P N L Y D V L E A R G L V A Q C T D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G I R E R L G S P V T L Y C G F D P T A D S L H
- - - - - - - - - - T L Y C G F D P T . D S L H
------------------------------GGGGTCCGCGACCTTGTCGCCGTGGAT---GACGCCGCCGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L G H L V P V M A L A H A Q R C G H K P L A L V
L G H L V P V M A L A H A Q R C - - K P L A L V
CTGGATCAGCCGGCGGGCCTCGCCGTTGCTCTTGGCGAAGCCGGCACG------CAGCTCGACGACGCCGAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G G A T A R V G D P S G K N T A R R M L S P E E
G G A - - - - - - - - - - - - - - - - - - - - -
GGGCGAGGC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I D A N A L A I G E Q I G R I V R F D D S P T G
- D A N A L A I G E Q I G R I . . . . . . . . .
---GTCGCGCGCCGCCGCGGCCGCGGGCTCGCCGTGCACGAGCCG---------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A K L V N N L D W I A G L T W L D F L R D V G S
A K L V N N L D - - - - - - - - - - - - - - - -
CGCCGCGTTGATGCCGGCGCCGCT------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R V S V N R M V G M E S V K P R L A E G S G I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F L E F S Y M L L Q A Y D F A H L G A E H G C T
- - - - S Y M L L Q A Y D F A - - - - - - - - -
------------CCAGACCGCGCCGGCCTCGGTCTTGCCGAACTT---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V Q I G G Q D Q W G N I V F G T E L G R K M H G
V Q I G G Q D Q W G N I V F G T E L G R K M - -
CATCGTGAGCGCCGCCAGGTCCAGGCCGTGCATCTTCCGCCCCAGCTCGGTGCCGAAGACGATGTT------
217218219220221222223224225226227228229230231232233234235236237238239240
L D L A A L T M P L I T K A D G R K F G K T E A
- - L A A L T M - - - - - - - - - K F G K T - -
------CTGCCCGCCGATCTGCAC---------------------------GGCGAAGTCGTACGC------
241242243244245246247248249250251252253254255256257258259260261262263264
G A V W L D A E R T P V F D F F Q F W R N A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G D V G R L L R Y F T F L P I D E I E A L E T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S G A G I N A A K A R L A Y E V T R L V H G E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A A A A A R D G A A K A F A G G A V D D A V P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G P L D L A S P V G V V E L M K R A G F A K S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G E A R R L I Q G G G V R I H G D K V A D P M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E V S A G D A R G G H V L L R A G K K R L Y R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415
D V A E A G S
- - - - - - -
---------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_tyr_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T D S W T W L Q R G T H E I F P D Q P E S A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P D V S L L A R L Q Q G D R P L R I K L G I D P
- - - - - - - - - - - - - - - - R I K L G I D P
------------------------------------------------TCCGCCTTGAATTTGCCGACGCGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T G S D I H L G H S I I F R K L R Q F Q D A G H
T . S D I H L G H S I I F R K L R Q F Q D A - -
TTC---ACTGGTCAGCCCCAAGCCCACAGCACTGACTAAGTAAAAAGCCTTAGCAGGAAAGTTAAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T A V L I I G D F T A R I G D P T G K S E V R R
T A V L I I G D F - - - - - - - - - - - - - - -
GAGCGGAAACTCCGGCACGGCTTCTGC---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q L T A E D V Q R N A E T Y L D Q L R P I L D F
- - - - - - - Q R N A E T Y L D Q L R P I L - -
---------------------GTGGTATTGGCTAACAACATCAAGTGCCAGCAGTTTTTGGCGATC------
121122123124125126127128129130131132133134135136137138139140141142143144
E T P G R L E I R Y N S E W L A G L D L A K I L
- - - - - - E I R Y N S E - - - - - - - - - - -
------------------TAAATCTTGGCTAGTTAGCAA---------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E L L G T M T V G Q M L A K E G F S E R Y D K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T P V Y L H E F L Y P L M Q G Y D S V A V Q S D
- - - - - - - - L Y P L M Q G Y D S V - - - - -
------------------------CAAAATGGGCAGCAGTAAGCCGAATTGAGGCTG---------------
193194195196197198199200201202203204205206207208209210211212213214215216
V E L G G T D Q K F N I A V G R D L Q R H F G L
V E L G G T D Q K F N I A V G R D L Q R H F - -
CTGCAAGTCTCTTCCCACAGCAATGTTGAACTTTTGGTCTGTGCCACCCAGTTCTACATCCGATTG------
217218219220221222223224225226227228229230231232233234235236237238239240
Q P Q F G L L L P I L I G L D G S Q K M S K S L
- - Q F G L L L - - - - - - - - - - K M S K S -
------ATCGTAGCCCTGCATCAG------------------------------TGTTCCTTTGTCGTA---
241242243244245246247248249250251252253254255256257258259260261262263264
G N Y V G L N E D A L S M Y S K L E K V P D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V A D Y F E L L T S Q D L A A L P E N P R D R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K L L A L D V V S Q Y H G A E A A A A A Q K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q E L V Q G S A V Q A E A V P E F P L S Q V N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P A K A F Y L V S A V G L G L T S S E A R R Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q G G A V R L D G Q K L D D P N H I F E A P T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402
L K G R V I Q V G K K K F V R L V L
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_tyr_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N F V E E L R W R G M V H D M M P G T E E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K E Q V T A Y V G I D P T A D S L H I G H L C
- - - - - T A Y V G I D P T . D S L H I G H L C
---------------ACTGCTTATGTGGGTATTGACCCGACA---GATTCATTGCATATCGGACACTTATGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G V M I L R H F Q R C G H K P L A L I G G A T G
G V M I L R H F Q R C - - K P L A L I G G A - -
GGTGTGATGATATTGCGTCACTTCCAGCGTTGT------AAACCATTGGCTTTGATTGGTGGTGCG------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M I G D P S G K S A E R N L L D E E T L R H N Q
- - - - - - - - - - - - - - - - - - - - R H N Q
------------------------------------------------------------CGTCACAATCAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A C I K K Q L A K F L D F E S D A P N R A E L V
A C I K K Q L A K F . . . . . . A - - - - E L V
GCTTGTATCAAAAAGCAACTAGCTAAGTTT------------------GCT------------GAACTAGTG
121122123124125126127128129130131132133134135136137138139140141142143144
N N Y D W M K E F T F L D F A R E V G K H I T V
N N Y D - - - - - - - - - - - - - - - - - - - -
AACAACTATGAT------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N Y M M A K E S V K K R L N G E A R D G L S F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E F T Y Q L L Q G Y D F L H L Y E T K G C K L Q
- - T Y Q L L Q G Y D F L - - - - - - - - - L Q
------ACCTATCAGTTGTTGCAAGGTTATGACTTTCTT---------------------------CTGCAG
193194195196197198199200201202203204205206207208209210211212213214215216
M G G S D Q W G N I T T G T E L I R R T N G G E
M G G S D Q W G N I T T G T E L I R R T - - - -
ATGGGAGGCTCTGATCAGTGGGGAAATATCACTACCGGTACTGAACTGATTCGTCGTACT------------
217218219220221222223224225226227228229230231232233234235236237238239240
A Y A L T C P L I T K A D G G K F G K T E S G N
A Y A L T C - - - - - - - - - K F G K T - - - -
GCTTATGCATTGACTTGT---------------------------AAATTTGGTAAGACC------------
241242243244245246247248249250251252253254255256257258259260261262263264
I W L D P R Y T S P Y K F Y Q F W L N V S D A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A E R Y I K I F T S L D K A E I D G L I A E H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E A P H L R V L Q K R L A K E V T V M V H S E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D Y N A A V D A S N I L F G N A T S D A L K K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D E D T L L A V F E G V P Q F E I S R D A L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G V K A V D L F V D N A A V F A S K G E M R K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V Q G G G V S L N K E K L A A F D Q V I T T A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430
L L D E K Y L L V Q R G K K N Y Y L I I A K
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_tyr_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N L L E E L Q W R G L V N Q T T D E D G L R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L N E E K V T L Y C G F D P T A D S L H I G H
- - - - - - - T L Y C G F D P T . D S L H I G H
---------------------CGCGTCTTGGATGCGCTCCCCGTTCAC---AATGGCGCCGTTTTGGATGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L V T I M T L R R F Q Q A G H Q P I A L V G G A
L V T I M T L R R F Q Q A - - Q P I A L V G G A
TTCGCGCGCCTGGCGCTTCGACGGCGAAATGCCGGCAGA------CAGCTCGACAAGCGGAACGTCGCCGCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G L I G D P S G R K S E R T L N A K E T V E T
- - - - - - - - - - - - - - - - - - - - - - E T
------------------------------------------------------------------GTCGCC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W S A R I K A Q L E R F L D F E A E S N P A K I
W S A R I K A Q L E R F . . . . A - - - - - K I
GCTAAAGAGCGCTTCAGAAATGCGAATCGCTTGCCT------------GCC---------------CACTTC
121122123124125126127128129130131132133134135136137138139140141142143144
K N N Y D W I G P L D V I S F L R D I G K H F S
K N N Y D - - - - - - - - - - - - - - - - - - -
CTCAGCAAGCGCCCT---------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V N Y M L A K E S V Q S R I E M G I S F T E F S
- - - - - - - - - - - - - - - - - - - - - - - S
---------------------------------------------------------------------TTG
169170171172173174175176177178179180181182183184185186187188189190191192
Y M M L Q A Y D F L N L Y E T E G C R L Q I G G
Y M M L Q A Y D F L - - - - - - - - - L Q I G G
GTAAAACTCATACGGCGACGTTTTTTCCGG---------------------------TTTTCCAAACTTCGT
193194195196197198199200201202203204205206207208209210211212213214215216
S D Q W G N I T A G L E L I R R T K G E A K A F
S D Q W G N I T A G L E L I R R T - - - - - A F
CCCATCGGCTTTCGTCACGAGCGGAACCGTCAAACCGAATGCTTTCGCCTC---------------GATGAG
217218219220221222223224225226227228229230231232233234235236237238239240
G L T V P L V T K A D G T K F G K T E S G A V W
G L T V - - - - - - - - - K F G K T - - - - - -
CTCAAGCCCCGC---------------------------ACCGATTTGTAGTCG------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L D P E K T S P Y E F Y Q F W I N T D D R D V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R Y L K Y F T F L S K E E I G A L E Q E L R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P E K R A A Q R A L A E E V T K L V H G E E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R Q A I R I S E A L F S G D I A N L T A A E I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q G F K D V P S F I H E G G D V P L V E L L V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A G I S P S K R Q A R E D I Q N G A I Y V N G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I Q D A G A V L T A E H R L E G R F T V I R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419
G K K K Y H L I R Y A
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_tyr_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L T I D E I L S R G V S E V I V E A N V R R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L N A G K P L R L K L G I D P T R S D I H I G H
- - - - - - - R L K L G I D P T . S D I H I G H
---------------------CGCCTCAAATTGGGCATCGACCCAACC---AGCGATATTCATATTGGCCAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A V A L R K M R Q F Q E L G H T V V L I V G D W
A V A L R K M R Q F Q E L - - T V V L I V G D W
GCAGTGGCGTTGCGCAAGATGCGCCAATTTCAAGAGCTT------ACCGTCGTTTTGATTGTGGGCGACTGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T A Q I G D P T G R D E S R P R L T V E E T K S
- - - - - - - - - - - - - - - - - - - - - - K S
------------------------------------------------------------------AAAAGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N A K Y Y M D Q V F K V I D P A K T E V R W Q S
N A K Y Y M D Q V F K V . . . . . T E V R W Q S
AACGCCAAATATTACATGGATCAAGTGTTTAAAGTG---------------ACTGAAGTTCGCTGGCAAAGC
121122123124125126127128129130131132133134135136137138139140141142143144
E W F G Q F D L E K A F G L I G R F T V N Q M L
E - - - - - - - - - - - - - - - - - - - - - - -
GAA---------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A H E T F R K R Y E A G Q Q L T V L E L M Y P M
- - - - - - - - - - - - - - - - - - - - M Y P M
------------------------------------------------------------ATGTACCCAATG
169170171172173174175176177178179180181182183184185186187188189190191192
L Q A Y D S I A I K P D I E F G G T D Q K F N I
L Q A Y D S I - - - - - I E F G G T D Q K F N I
CTGCAAGCCTACGATTCGATT---------------ATTGAGTTTGGTGGCACTGACCAAAAATTCAACATT
193194195196197198199200201202203204205206207208209210211212213214215216
L A G R Q L M E Q M G M E S Q D V I L V P L I I
L A G R Q L M E Q M - - - - Q D V I L V - - - -
TTGGCTGGGCGACAATTGATGGAACAAATG------------CAGGATGTCATCCTCGTG------------
217218219220221222223224225226227228229230231232233234235236237238239240
G T D G R K M S K S F N N S V D I L M S P N D K
- - - - - K M S K S - - - - - - - - - - - - - -
---------------AAGATGAGCAAAAGC------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y G K I M S M G D D V L P V Y Y E V W S D A P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A E V K A M S E A I K A G S V N P R D L K M Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A R D I I R Q L D G E A A A A E A E A E F I R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F Q Q R D L P T D M P E V A L S E A A N I V D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L V S T K L A A S K G E A R R L I D G G G V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A G E K I S S Y D S L V Q P V G E Q I L Q V G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393
R K F V K L L G N
- - - - - - - - -
---------------------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_tyr_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T P E E Q V K I L K R N V V D L I S E E E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D R I K R K G K L R V K L G V D P S R P D L H L
- - - - - - - - - R V K L G V D P S . P D L H L
---------------------------CTCTATCCTCTCTCCGTCGATGTACAC---ACCTTGAGAAACGAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H A V V L R K L R E F Q D L G H T V V L I I G
G H A V V L R K L R E F Q D L - - T V V L I I G
TCTTTTAGCCTCACTTTTGCTGGATGCAGCTCCTATCTCCACGAG------CACGATGTTCTTCTCCTGAGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F T A R I G D P S G R N E T R P M L T K E E V
D F - - - - - - - - - - - - - - - - - - - - - -
AATCTC------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E N A K T Y Q E Q A F K I L D P K R T E L R F
L E N A K T Y Q E Q A F K I . . . . . T E L R F
CTTTGCGTTTTCTTCACCATGGAAGAAGCGCGTTATCTCGTA---------------CACGTCTCGTGGATT
121122123124125126127128129130131132133134135136137138139140141142143144
N G E W L D R M T F A D V I I L A S K Y T V A R
N G E - - - - - - - - - - - - - - - - - - - - -
GATCGTTTT---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M L E R D D F A K R F K E G I P I A I S E F L Y
- - - - - - - - - - - - - - - - - - - - - - L Y
------------------------------------------------------------------GAAAGC
169170171172173174175176177178179180181182183184185186187188189190191192
P L A Q A Y D S V A I Q S D V E L G G T D Q L F
P L A Q A Y D S V - - - - - V E L G G T D Q L F
GATGTAGTTTCCGTAGCTTTTGCTCAT---------------TGTTCCCTCGATGATCGGCATCGTCATGAC
193194195196197198199200201202203204205206207208209210211212213214215216
N L L V G R K I Q E E Y G Q E P Q I V M T M P I
N L L V G R K I Q E E Y - - - - Q I V M T M - -
GATCTGGGGCTCTTGACCGTATTCTTCCTGTATCTT------------GAGGTTGAAAAGCTGATC------
217218219220221222223224225226227228229230231232233234235236237238239240
I E G T D G K L K M S K S Y G N Y I A F N D P P
- - - - - - - - K M S K S - - - - - - - - - - -
------------------------GGCAACGGAATCGTA---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E E M Y G K L M S I P D E L I I K Y M R L L T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I P E E R I E E Y E R K M K E K T I N P R D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M V L A Y E I T R F F H G E E N A K K A Q E H F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V K V F Q K K E I P D E M P V V E I S Q E K N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V D L L V E I G A A S S K S E A K R L V S Q G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V Y I D G E R I E D I K F T V E P D G E R V L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401
V G K R K F Y R I S G G E T K K L
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class I
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_tyr_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T P E E Q L R I I K E G T V E I I E E E E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K K L K E G R P L R V K A G F D P T A P D L H L
- - - - - - - - - R V K A G F D P T . P D L H L
---------------------------GTTTATTTTAAGACCTCCGCCCTGTAT---TCTTCTGGCTTCGTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H V V L L Q K L R Q F Q Q L G H E V F F I I G
G H V V L L Q K L R Q F Q Q L - - E V F F I I G
CTTTGATTTTACCGCTCCTATTTTTACGAGGAAATCTACGGCTCT------TTTCTCATTTAGTTTTACAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F T A M I G D P T G R S Q T R P P L S R E Q V
D F - - - - - - - - - - - - - - - - - - - - - -
AGGTGC------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E N A K T Y E H Q V F K V L I P E K T T V V F
L E N A K T Y E H Q V F K V . . . . . T T V V F
TTCCGAGTGAAAGCGCTTGACTATAGTAAAGGCGAGGAGTTT---------------GTGCATCTCCCTTCT
121122123124125126127128129130131132133134135136137138139140141142143144
N S T W L E E L G T K G L I E L C A K Y T V A R
N S T - - - - - - - - - - - - - - - - - - - - -
CATTTTCTC---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M L E R E D F S K R F K E G I P I Y I H E F I Y
- - - - - - - - - - - - - - - - - - - - - - I Y
------------------------------------------------------------------TGACAT
169170171172173174175176177178179180181182183184185186187188189190191192
P L L Q A Y D S V A I K A D V E I G G T D Q K F
P L L Q A Y D S V - - - - - V E I G G T D Q K F
CTTCCTTACGCCGTCCGTTCCCACGAG---------------GCACACCTGAGGCTCCTGCCCGTACTCCCT
193194195196197198199200201202203204205206207208209210211212213214215216
N L L I G R D I Q R E Y G Q E P Q V C I T L P L
N L L I G R D I Q R E Y - - - - Q V C I T L - -
CTGTATGTCTCTACCTATGAGTAGGTTAAACTTTTG------------TATCTCAACGTCAGCCTT------
217218219220221222223224225226227228229230231232233234235236237238239240
L V G T D G V R K M S K S Y G N Y V G I T E D P
- - - - - - - - K M S K S - - - - - - - - - - -
------------------------CGGATATATAAACTC---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K T M F A K I M S I P D E I M W D W F L L L T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y N K E E I E K M R R E M H P M E A K K L L A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T I V K R F H S E E E A R K A K E W W E K T F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q R E F P E D A P L V K L N E K K L R A V D F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K I G A V K S K N E A R R V I Q G G G L K I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G E K V T D P N T E I E I N G E L K V K V G K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392
K F Y R V V S G
- - - - - - - -
------------------------
Class I
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_tyr_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F P P V D E Q L A V L T R G A A Q F D G S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R E E L K K K L E K S F T S G K P L R V K Y G I
- - - - - - - - - - - - - - - - - - R V K Y G I
------------------------------------------------------GATCTTCCGCCGCGCCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D P T G F D V H L G H T V P L R K L R Q F Q E F
D P T . F D V H L G H T V P L R K L R Q F Q E F
ACTTTTACT---TGTCAGCTTCGTTTCGGCGATCAGGTCGACGGCCAGCATCGCGCCGTCTTTAATCTTGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G H T A V L I I G T A T A A V G D P S G R D A S
- - T A V L I I G T A - - - - - - - - - - - - -
------TATGCTGATGTCGTCAATGTTAACGGG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Q G L T T E Q I D K N A Q T Y L T Q I A K V V
- - - - - - - - - D K N A Q T Y L T Q I A K V .
---------------------------GAAGCGCACGATGTCTGCCGCCAGCGTTTTCTTGGCTTCCAG---
121122123124125126127128129130131132133134135136137138139140141142143144
D V S K A E V R P N G E W F S K F T F A D M L K
. . . . A E V R P N G E - - - - - - - - - - - -
------------TCGGGTTACGTCCTCGTGCGACCG------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L G H T T M Q R M I E R D D F T K R I K A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A I Y L H E C L Y P L M Q G H D S V E I R A D V
- - - - - - - L Y P L M Q G H D S V - - - - - V
---------------------GTCCGTGCCGCGAAGGATCGGCATCGTGAGGCA---------------GCC
193194195196197198199200201202203204205206207208209210211212213214215216
E L G G T E Q L Y N L M V G R D L Q R A A G Q E
E L G G T E Q L Y N L M V G R D L Q R A A - - -
GGCGGCCCGCTGAAGGTCGCGGCCCACCATCAGGTTGTAAAGCTGTTCGGTGCCGCCGAGTTC---------
217218219220221222223224225226227228229230231232233234235236237238239240
P Q I C L T M P I L R G T D G E K K M G K S V G
- Q I C L T M - - - - - - - - - - K M G K S - -
---GATCTCGACGGAGTCGTG------------------------------CAGGTAGATCGCGGC------
241242243244245246247248249250251252253254255256257258259260261262263264
N Y I G L N E P A K D M F G K T M R I H D E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T E W Y A L L T D R S H E D V T R L L T T P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A K K T L A A D I V R F Y H G E E V A S A T R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D W D N A A K N I D P V N I D D I S I P A D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K D G A M L A V D L I A E T K L T A S K S E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R K I E E G A F N Y G P G R T K P A D V K A T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404
P V T D G L V I R L G R K I L R V R L G
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_tyr_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S V T N L S S P R Q E P S S Q L A T A T P D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N W L R R G V S E I F P D Q P D S S N P E E N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K L L K M T N R P L R I K F G I D P T G A E I
- - - - - - - - - - - R I K F G I D P T . A E I
---------------------------------ACTGGCGCTGACAATGTAAAACAATTT---TGGAAATTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L G H S I P V R K L R A F Q D A G H K A V L L
H L G H S I P V R K L R A F Q D A - - K A V L L
GATTTGAGATAGCGAAAATTCTGGTACGGCTGAAGTATCGGCTGTATTGCC------CAGTGACATTGCTGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I G D F T A R I G D P T G R S E V R R Q L S A A
I G D F - - - - - - - - - - - - - - - - - - - -
TTTTTGAGCGTT------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E V A E N A K N Y L D Q V R P I L D F A P D K L
- - A E N A K N Y L D Q V R P I L - - - - - - -
------GGGAGTTTCCGGCAATCCATCTAAGGGTAAATTTGTCAATAACTC---------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E V R Y N S E W L S K L D L T K I L E L L S T M
E V R Y N S E - - - - - - - - - - - - - - - - -
GTCTGGCGTTTTTTCCAGCTT---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T V G Q M L A K E G F A E R Y E K E N P I Y I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E F L Y P L V Q G Y D S V A L E A D V E L G G T
- - L Y P L V Q G Y D S V - - - - - V E L G G T
------TCTTTGCAAATCTCGCCCTACAGCAATGTTAAA---------------ACCCAACTCTACATCTGC
217218219220221222223224225226227228229230231232233234235236237238239240
D Q K F N I A V G R D L Q R H F G Q K P Q F G V
D Q K F N I A V G R D L Q R H F - - - - Q F G V
TTCTAACGCTACAGAATCGTATCCCTGTACCAGGGGATAGAGAAATTC------------GGGATTTTCTTT
241242243244245246247248249250251252253254255256257258259260261262263264
L L P I L I G T D G N Q K M S K S L G N Q V G L
L L - - - - - - - - - - K M S K S - - - - - - -
CTCGTA------------------------------TTGCCCGACAGTCAT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L E E P L L M Y S K L E K T P D H L L K D Y F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L L T N L P L D G L P E T P R D R Q K L L A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V V S Q Y H G K E A A Q N A Q K A A M S L V Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N T A D T S A V P E F S L S Q I K F P A K L F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I V S A S G L C P T S S E A R R Q V Q G G A V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L D G D R L N Q V D L I F N S P D E L D G K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423
Q V G K N K F V K L V N G N G
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_tyr_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N S F L K E L Q E K N L I Q D I S N I E K I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N S L K N K M G I Y V G F D P S A K S I H L G N
- - - - - - - G I Y V G F D P S . K S I H L G N
---------------------GGTATTTATGTAGGTTTTGATCCAAGT---AAAAGCATTCATTTAGGAAAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F V V I N V L L I A K K H R I P T V A L I G G A
F V V I N V L L I A K K H - - P T V A L I G G A
TTTGTTGTTATTAATGTACTTTTAATTGCAAAAAAACAC------CCAACAGTCGCTTTAATTGGTGGAGCA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G G I G D P S G K K S E R I L I D E D T L K K
- - - - - - - - - - - - - - - - - - - - - - K K
------------------------------------------------------------------AAAAAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N T E A I K K Q I K H F L P D A K I V N N S D F
N T E A I K K Q I K H F . . . A K I V N N S D -
AACACAGAAGCAATTAAAAAGCAAATTAAACATTTT---------GCAAAAATTGTTAATAATAGTGAT---
121122123124125126127128129130131132133134135136137138139140141142143144
Y K N Q S F I D F L R D V G K F I Q V S Y M L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K E I V K N R L E S G I S F T E F A Y S L I Q A
- - - - - - - - - - - - - - - - - A Y S L I Q A
---------------------------------------------------GCATATTCACTAATTCAAGCA
169170171172173174175176177178179180181182183184185186187188189190191192
N D F H Y L F K N H N V G I Q F G G S D Q W G N
N D F H - - - - - - - - - I Q F G G S D Q W G N
AATGATTTTCAT---------------------------ATTCAATTTGGAGGTTCAGATCAATGAGGGAAT
193194195196197198199200201202203204205206207208209210211212213214215216
I T T G L E L I R K R N G E N S F S G G F T I K
I T T G L E L I R K R - - - - - - S G G F T I -
ATTACGACAGGTCTTGAATTAATTAGAAAAAGA------------------AGTGGAGGTTTTACAATC---
217218219220221222223224225226227228229230231232233234235236237238239240
L L L K S D G T K F G K S E Q G A I Y L D P S L
- - - - - - - - K F G K S - - - - - - - - - - -
------------------------AAATTTGGAAAAAGT---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T S P Y T M Y Q F L L N Q N D S D L L N L F N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I S D L G I K E I L E I I T K H S E N P E K R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G Q K M L A N N I V N R I H G K N A L N E V E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I S N I L F K N G K I N D L S K S E V S I I I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S F E V N H V N F S N D E K I I D I L D R A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F K S K N E I R K L I E Q K G L V V G A E I I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D F D Q I L K D S N L T H G V I F A R Q G K K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415
I F I I K K S
- - - - - - -
---------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_tyr_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N L A L S L L H K R G F L K Q C T S L K V L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L M D R E K I V F Y A G V D A T S S S L H I G
- - - - - - - - V F Y A G V D A T S S . L H I G
------------------------TACCCTTTTACCATTAATATAAACACCTCCAGA---AATCAATCTTCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H L I P F L A M M H L R Q H G H M P I V L I G D
H L I P F L A M M H L R Q H - - M P I V L I G D
GCCTTCTGATTTGCTGGGCACAATTTTTGAATCTAACATTAA------CAATAATATCTCTTCTTTTAGGCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S T A K I G D P S G K S E M R K I L S S E E I G
S - - - - - - - - - - - - - - - - - - - - - - G
AGA------------------------------------------------------------------CTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N N A L L I K N Q L Q R I T K F T S E C F I H N
N N A L L I K N Q L Q R I . . . . . E C F I H N
TTGAACTTTCAAGGCTTCTGCCTCTCCGTGAACAATTTT---------------CAAAATCTCTTTGGCCTT
121122123124125126127128129130131132133134135136137138139140141142143144
S N W L D N L N Y I E F L R D V G M H F S V N R
S N - - - - - - - - - - - - - - - - - - - - - -
ATTTAA------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M L S F E T Y K R R M D F G L S F I E F N Y Q L
- - - - - - - - - - - - - - - - - - - - N Y Q L
------------------------------------------------------------AAAAAGATTAGA
169170171172173174175176177178179180181182183184185186187188189190191192
L Q S Y D Y Y M L N K I K N C R L Q I G G D D Q
L Q S Y D Y Y - - - - - - - - - L Q I G G D D Q
ATCAAGATAAACAGCGCCTTT---------------------------ACTTCTTGTAATTAATGGAAAAGT
193194195196197198199200201202203204205206207208209210211212213214215216
W G N I I S G V D L I R K K N G S E T F G L T F
W G N I I S G V D L I R K K - - - - T F G L T F
AAGCCCAAAAGTTTCTGATCCATTTTTTTTTCTAATTAGGTC------------AATATTCCCCCATTGATC
217218219220221222223224225226227228229230231232233234235236237238239240
P L I T R S D G K K M G K S E K G A V Y L D S N
- - - - - - - - - K M G K S - - - - - - - - - -
---------------------------TTTAATTTTATTAAG------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L F S I Y D F Y Q Y F R N T S D S D V K T F L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L F T F L E E D E I E L I S N F K G N S L N K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E I L A F E I T K I V H G E A E A L K V Q E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S F A A F R G S G D R S N I P F F K F S F S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K E E I L L V D L M L D S K I V P S K S E G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L I D S G G V Y I N G K R V E S Q S H L L T K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405
D F N N N E V E L R V G K K K F L R I V I
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_tyr_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y D F I A N L R W R G M I H D I T P G L E A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L Q K E M I T G Y I G F D P T A P S L H V G N L
- - - - - - T G Y I G F D P T . P S L H V G N L
------------------ACTGGTTATATTGGTTTTGATCCTACA---CCTTCATTGCATGTAGGAAATCTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A T I M L L K H F Q L A G H K P I A V V G G A T
A T I M L L K H F Q L A - - K P I A V V G G A -
GCTACTATTATGCTGCTTAAACATTTTCAACTAGCA------AAGCCTATTGCCGTAGTAGGGGGTGCT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G M I G D P S F K S T E R K F L S E E E L L H N
- - - - - - - - - - - - - - - - - - - - - L H N
---------------------------------------------------------------CTACATAAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q S C I M K Q L K C F L D F S S S A N T A E L L
Q S C I M K Q L K C F . . . . . . A - - - E L L
CAATCATGCATTATGAAACAGTTGAAGTGTTTT------------------GCC---------GAGTTACTC
121122123124125126127128129130131132133134135136137138139140141142143144
N N I D W F K D F G F L R F L R E V G K H I S I
N N I D - - - - - - - - - - - - - - - - - - - -
AACAATATAGAT------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N Y M M A K E S V K R R L E D G I S F T E F S Y
- - - - - - - - - - - - - - - - - - - - - - S Y
------------------------------------------------------------------TCTTAC
169170171172173174175176177178179180181182183184185186187188189190191192
Q L L Q G Y D F Y Y L Y N T K G V K L Q M G G A
Q L L Q G Y D F Y - - - - - - - - - L Q M G G A
CAGTTGCTACAAGGATATGATTTTTAT---------------------------CTACAAATGGGTGGGGCA
193194195196197198199200201202203204205206207208209210211212213214215216
D Q W G N L T T G I E L I R R K T G E E A F A L
D Q W G N L T T G I E L I R R K - - - - A F A L
GATCAATGGGGAAATCTTACCACAGGTATAGAACTAATTCGTAGAAAA------------GCTTTTGCTTTA
217218219220221222223224225226227228229230231232233234235236237238239240
T A P L I T K A D G T K F G K S E Q G N I W L D
T A - - - - - - - - - K F G K S - - - - - - - -
ACTGCA---------------------------AAGTTTGGTAAGTCA------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S T M T S P Y E F Y Q F W L N C T D E D A C R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I K V F T L L S K E E I D N L I E L H V Q A P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q R I L Q K Q I A K E L T I R V H S E T D Y M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A R K T S E L L F G H A T A E D L W E L S E K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F K V I F K S I P E V H I T L T Q L T E A E H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L D L V A S T G F G I M F N S K G E V R R A I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E G S L S V N K E K I T D P L Q K P N L K L L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427
D K Y L L V Q R G K K H H Y L I K V S
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_tyr_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K M S E I R R N V P V N E Q I Q L L K R G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L V S E E D L K R K I E K G E P L R V K L G A
- - - - - - - - - - - - - - - - - - R V K L G A
------------------------------------------------------CGCGTCAAGCTCGGCGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D P T R P D L H L G H A V I L R K M R Q F Q D L
D P T . P D L H L G H A V I L R K M R Q F Q D L
GACCCCACC---CCCGACCTGCACCTCGGGCACGCCGTCATTCTGCGCAAAATGCGGCAGTTTCAGGACCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G H K V I M L I G D F T A T I G D P S G K S K T
- - K V I M L I G D F - - - - - - - - - - - - -
------AAGGTCATCATGCTGATCGGCGACTTC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R P P L S L E E A R A N A E S Y L A Q C R L I L
- - - - - - - - - R A N A E S Y L A Q C R L I L
---------------------------CGCGCCAACGCCGAGAGCTACCTCGCGCAGTGCCGCCTGATTCTG
121122123124125126127128129130131132133134135136137138139140141142143144
R Q E P E A L E I R Y N S E W L E Q L G Y K D I
- - - - - - - E I R Y N S E - - - - - - - - - -
---------------------GAAATCAGGTACAACTCCGAG------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I G L A A K Y T V A R I L E R D D F T K R L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G T P I S M H E L L Y P L T Q G Y D S V A L H A
- - - - - - - - - L Y P L T Q G Y D S V - - - -
---------------------------CTCTACCCGCTCACCCAGGGCTACGACTCGGTG------------
193194195196197198199200201202203204205206207208209210211212213214215216
D V E L G G T D Q L F N N L V G R A L Q R D Y G
- V E L G G T D Q L F N N L V G R A L Q R D Y -
---GTGGAACTCGGGGGCACCGACCAGTTGTTCAACAACCTGGTGGGCCGCGCCCTGCAACGCGACTAC---
217218219220221222223224225226227228229230231232233234235236237238239240
Q E A Q V V L T L P L L V G L D G T E K M S K S
- - - Q V V L T L - - - - - - - - - - K M S K S
---------CAGGTCGTGCTGACGCTG------------------------------AAGATGTCCAAGAGC
241242243244245246247248249250251252253254255256257258259260261262263264
L D N Y I G L T D E P H A M F A G L M K V P D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L L D N Y F T L L T D L P R E R I E E L L A G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P V A A H R E L A R E V V R A F H P D A D L D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A E A R F R S V A K G G I P D N I P A V S V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E L N E Q G H V S M A K L V V L A G L E P S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G A A R K L I Q N R G L K L G G E T Y S D P Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q L T R E Q L T E G V V I Q K G K D K F A R L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411
L E G
- - -
---------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_tyr_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N T D D R Y K L L R S V G E E C I Q E S E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N L I E K K P L I R C Y D G F E P S G R M H I A
- - - - - - - - - R C Y D G F E P S G R M H I A
---------------------------CGCTGCTACGATGGCTTCGAGCCCTCCGGCCGCATGCACATTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q G I F K A V N V N K C T A A G C E F V F W V A
Q . I F K A V N V N K C T A A - - E F V F W V A
CAG---ATCTTCAAGGCGGTCAATGTCAACAAGTGCACCGCCGCC------GAGTTTGTCTTCTGGGTGGCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D W F A L M N D K V G G E L E K I R I V G R Y L
D W - - - - - - - - - - - - E K I R I V G R Y L
GACTGG------------------------------------GAGAAGATCCGCATTGTTGGCCGGTACCTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I E V W K A A G M D T D K V L F L W S S E E I M
I E V W . . . . . . . . . V L F L W S S E - - -
ATTGAGGTGTGG---------------------------GTTTTGTTTTTGTGGAGCAGCGAG---------
121122123124125126127128129130131132133134135136137138139140141142143144
S H A D T Y W R M V L D I G R Q N T I A R I K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
C C T I M G K T E G T L T A A Q V L Y P L M Q C
- - - - - - - - - - - - - - - - - L Y P L M Q C
---------------------------------------------------CTGTACCCGCTGATGCAGTGC
169170171172173174175176177178179180181182183184185186187188189190191192
C D I F F L K A D I C Q L G L D Q R K V N M L A
C D I F - - - - - I C Q L G L D Q R K V N M L A
TGCGACATCTTC---------------ATCTGCCAACTGGGCCTGGACCAGCGCAAGGTGAACATGCTCGCA
193194195196197198199200201202203204205206207208209210211212213214215216
R E Y C D L I G R K L K P V I L S H H M L A G L
R E Y C D L I - - - - - P V I L S H - - - - - -
CGCGAGTACTGCGACCTGATT---------------CCGGTCATTCTGTCACAC------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R R G Q A K M S K S D P D S A I F M E D T E E D
- - - - - K M S K S - - - - - - - - - - - - - -
---------------AAGATGAGCAAGAGT------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V A R K I R Q A Y C P R V K Q S A S A I T D D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A P V A T D D R N P V L D Y F Q C V V Y A R P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V A A I D G T T Y A T Y E D L E Q A F V S D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V S E D A L K S C L I D E V N A L L A P V R Q H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F A S N E E A H E L L E A V K S Y R K G G A T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P L A E T A L P A A P E K P H A C M W M P A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K V P L D V A E G M I K A T E D F I A A H P G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T V T V V L P D W S A V A S D E I T G V E K D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S A A L Q V N C A L L K A Y G L P N S V K I V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E N E V I L G N R N D F W V S V I G I A R K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L S H I E E L Y G G E L R N A G Q V I A A L M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V A T A L M L S V S H V I S T S L D G H I N A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A R E Y T K E R I E C V Q T L E G R I P A L H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P G A A P A V L G A D D V L Y L D D N D M D I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R K I K K A Y S A P N E E A N P V I S V A Q H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L A Q H G A L N I E R G E A N G G N V S Y N T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E A L V A D C G S G A L H P A D L K A A V L Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L L D R S A Q A R A L L N G E L K K N M T A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682
N A E K K M A K K R
- - - - - - - - - -
------------------------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_tyr_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S S N S C T E T I P K Y I L K G S E E P L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S K L T L E E R H K L C L S V G E E C I Q E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L E L L K R K E H P I C Y D G F E P S G R M H
- - - - - - - - - - - I C Y D G F E P S G R M H
---------------------------------GGTAAAGGTGATATCACCACCATACTCTTCTTTTCTAGA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I A Q C I L K T I N V N K L T E C G C V F V F Y
I A Q . I L K T I N V N K L T E C - - V F V F Y
AACATGGAA---ACCGAATTTGGGGAATACTAGAGTATTAATATATTCAAT------ATTTCCTTCAATAAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V A D W F A L L N N K M G G D L E K I K I V G E
V A D W - - - - - - - - - - - - - - - K I V G E
GCCTGGAGGACA---------------------------------------------AACAAATATTGCAGA
121122123124125126127128129130131132133134135136137138139140141142143144
Y F V H I W K A A G M D M T N V R F V W A S D F
Y F V H I W K A A . . . . . . V R F V W A S D -
AGAAGTGTCAGATTTTGACATTTTTTC------------------AGGAAGCATCTTATGGGAAAGGAT---
145146147148149150151152153154155156157158159160161162163164165166167168
I N G E D S N E Y W L R V F D I S R K F N I T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I K R C C Q I M G R Q E N D E Q P C A S V F Y P
- - - - - - - - - - - - - - - - - - - - - F Y P
---------------------------------------------------------------TGAAGCACA
193194195196197198199200201202203204205206207208209210211212213214215216
C M Q C A D I F Q L K A D I C Q L G M D Q R K V
C M Q C A D I F - - - - - I C Q L G M D Q R K V
CGGTTGTTCATCATTTTCTTGTCT---------------ACATCTTTTAATTCTAGTAATATTAAACTTTCT
217218219220221222223224225226227228229230231232233234235236237238239240
N M L A R E Y C D A A G I K H K P V I L S H K M
N M L A R E Y C D A A - - - - - P V I L S H K M
AGAAATATCAAAAACTCTTAACCAATACTCATT---------------AATAAAATCAGATGCCCAAACAAA
241242243244245246247248249250251252253254255256257258259260261262263264
L P G L L E G Q E K M S K S D T S S A I F V E D
L - - - - - - - - - - - - - - - - - - - - - - -
TCT---------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T P E A V V K K I K K A F C P P G I I E G N P C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I E Y I N T L V F P K F G H F H V S R K E E Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G D I T F T N K E D F H K A Y L S G D L H P G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L K K G L S D A L N L M L Q P I R D H F N T D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376
R A K E L L Q L V Q S F K V T K
- - - - - - - - - - - - - - - -
------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_tyr_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A T D A V T V L E P E K E Q G A Q Q L K I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V L R S R G L V Q D I T S P S L E K V A A T E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L T V Y C G F D P T A E S L H L G N L L G I I V
- T V Y C G F D P T . E S L H L G N L L G I I V
---ACGGTGTACTGCGGATTCGACCCCACA---GAGAGCCTGCACTTGGGCAACTTGCTGGGCATCATCGTG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L T W F Q R C G H Q P V A L L G G A T G R V G D
L T W F Q R C - - Q P V A L L G G A . G R V . .
CTCACTTGGTTCCAGCGCTGC------CAGCCAGTGGCTCTGCTGGGGGGTGCA---GGCCGTGTG------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P S G R S T E R P V L S E D E I E R N V Q G I R
. . . . . . . . . . . . . . . . . . N V Q G I R
------------------------------------------------------AATGTTCAGGGCATCAGG
121122123124125126127128129130131132133134135136137138139140141142143144
R I L E S L I G S S N G A G P A P Q I L N N L D
R I L E - - - - - S . . . . P - - Q I L N N L D
CGGATCTTGGAG---------------AGC------------CCT------CAAATCCTGAACAACCTGGAT
145146147148149150151152153154155156157158159160161162163164165166167168
W F K E V G L L S F L R D V G K F A R V G T M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A R D A V K S R M E L D N E G I S F T E F T Y Q
- - - - - - - - - - - - - - - - - - - - - T Y Q
---------------------------------------------------------------ACCTACCAG
193194195196197198199200201202203204205206207208209210211212213214215216
L L Q G Y D F V H L N R E H G V R M Q I G G S D
L L Q G Y D F V - - - - - - - - - M Q I G G S D
CTGCTGCAGGGGTATGACTTTGTG---------------------------ATGCAGATAGGCGGGTCGGAT
217218219220221222223224225226227228229230231232233234235236237238239240
Q M G N I I T G L D L I R R M G G G A P E A A C
Q M G N I I T G L D L I R R M - - - - - - - - C
CAGATGGGCAACATCATCACAGGGCTGGACCTCATCCGGCGCATG------------------------TGC
241242243244245246247248249250251252253254255256257258259260261262263264
F G L T F P L L T K A D G T K M G K S A D G A V
F G L T F - - - - - - - - - K M G K S - - - - -
TTCGGCCTCACTTTC---------------------------AAAATGGGCAAGAGC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
W L A A E K M S P F K F Y Q Y L L T S V G D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V I K F L R M L T F V P L E D I A Q L E A S M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q P G Y Q P N T A Q R L L A S E V T R F V H G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G L D Q A L N A T Q A L A P G S D T K L D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L E A V A G S A P T V E L P A G Q V L G Q T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A D I M V A I K L Q E S K S A G R R L I K G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V R V N N Q K V S D E Q R R L S E D D F I D G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450
L A L I A A G K K N K M L L R I S R
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_tyr_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T L A T L P P L T P A Q K Q H L L E K L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D I M C P E E L H A L L H A D G N K R L T C Y D
- - - - - - - - - - - - - - - - - - - - T C Y D
------------------------------------------------------------TGCAATTCTTCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G F E P S G R I H I A Q G I A K A I N V N R L L
G F E P S G R I H I A Q . I A K A I N V N R L L
CTCCACATATGCCGTCTCCAGCTCCTCATAATTAGC---TTGACTGCAGTCAGCGGCACTACCGTCCCGGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R S G I D C V F Y V A D W F A A L N N K C D A E
R S - - D C V F Y V A D W - - - - - - - - - - -
GTATGG------AACAACTGATCCTAAACACTCTGTTGA---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L S K I Q I L G R Y F V E V W K A C G M L G V S
- - - - Q I L G R Y F V E V W K A C . . . . V -
------------CTCAAGAATAGGATTGCCGCTCTCGGCTCCTGGTTCTGGACA------------GAT---
121122123124125126127128129130131132133134135136137138139140141142143144
K P V V F S T G Q K A S V R F V W A S E F I R Q
- - - - - - - - - - - - - R F V W A S E - - - -
---------------------------------------AGAGTCAGGAACAGACTTGCT------------
145146147148149150151152153154155156157158159160161162163164165166167168
N S S S Y W M R V M N I A R S F T V P R M Q R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S T I M G R T E G D D Q P I S Q I L Y P S M Q C
- - - - - - - - - - - - - - - - - L Y P S M Q C
---------------------------------------------------AACCAGATCCAGCTTTAGCTC
193194195196197198199200201202203204205206207208209210211212213214215216
A D I F E L K L D L V E M G L D Q R K V N A L A
A D I F - - - - - L V E M G L D Q R K V N A L A
AAAGATATCCGC---------------ATATAGTATTTGAGAAATTGGCTGATCATCACCCTCTGTTCGGCC
217218219220221222223224225226227228229230231232233234235236237238239240
R D Y C D K S V E L R H H K P V I L M H H M L L
R D Y C D K S - - - - - - - P V I L M H - - - -
CATTATAGTTGAGCATCGCTG---------------------ACGTGCAATATTCATTAC------------
241242243244245246247248249250251252253254255256257258259260261262263264
G L V G D G K M S K S V P D S A I Y M D D S F E
- - - - - - K M S K S - - - - - - - - - - - - -
------------------GATGAACTCACTTGC---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I Q R K I M N A S C P E P G A E S G N P I L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y Y K Y I V F G A I E Q E M I S T E C L G S V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L P Y D R D G S A A D C S Q F A N Y E E L E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A Y V E G R I A P H V L K S S L V H Y I D S L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A P V R A H F K S T P E L S R L L S D V H N I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387
S V R
- - -
---------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_tyr_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K E S T S N R I L P K W L M R G I V D L F P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A S E G S S D Q I F Q L R L S E A E K F A R P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V K L G I D P T G T D I H L G H S I L F R K L
R V K L G I D P T G . D I H L G H S I L F R K L
CGTGTAAAACTAGGTATTGATCCGACTGGT---GATATTCACCTCGGGCACAGTATTTTGTTCAGAAAGTTG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R A F Q D A G H I A V L I I G D F T A R I G D P
R A F Q D A - - I A V L I I G D F . A - - - - -
AGAGCTTTTCAAGATGCA------ATAGCCGTTTTAATTATAGGCGACTTT---GCT---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T G K N T T R V Q L S I E E V E A N A Q T Y L Q
- - - - - - R . . . . I . . . . . N A Q T Y L Q
------------------AGA------------ATC---------------AATGCTCAAACCTATTTACAG
121122123124125126127128129130131132133134135136137138139140141142143144
Q L G K D Q P K E K A L L D F E T P G R L E V Y
Q L G K D . . . . . . L - - - - - - - - - E V Y
CAGCTTGGAAAAGAC------------------TTA---------------------------GAGGTGTAC
145146147148149150151152153154155156157158159160161162163164165166167168
Q N S T W L G E M D L L E I I K L L G T A T V G
Q N S T - - - - - - - - - - - - - - - - - - - -
CAAAATAGCACC------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q M L A K E D F A N R Y K L G T P I A L H E F L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------TTA
193194195196197198199200201202203204205206207208209210211212213214215216
Y P L L Q G Y D S V A I R A D V E L G G T D Q R
Y P L L Q G Y D S V - - - - - V E L G G T D Q R
TATCCTTTGCTACAAGGATATGATTCTGTT---------------GTTGAGTTAGGGGGGACTGATCAACGA
217218219220221222223224225226227228229230231232233234235236237238239240
F N V A I G R D L Q R Y Y G Q R P Q F C L L L P
F N V A I G R D L Q R Y Y - - - - Q F C L L L -
TTTAATGTTGCAATAGGACGTGATCTTCAGAGGTATTAT------------CAGTTTTGTTTATTATTA---
241242243244245246247248249250251252253254255256257258259260261262263264
I L P G L D G V Q K M S K S L H N T V N L T E D
- - - - - - - - - K M S K S - - - - - - - - - -
---------------------------AAAATGAGTAAAAGT------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A L S M Y S K L E K L P D N V V N Q Y L T L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D I D L A N L V G T P R E R Q K R M A F Q I T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N W H G D A A A S A A Q L D A A K L V V G I A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I E L K Q N L K E V S L N E V K F P A K A F Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L S A V G I C A S S S E A R R K I Q G G G V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D G E K I I D P N Q E F A K A S D L S G K V L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420
L G K K I F R R L I L S
- - - - - - - - - - - -
------------------------------------
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_tyr_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_tyr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N E K L S N L K I T E N N K S I G W R V V V G
- - - - - - - - - - - - - - - S I G W R V V V G
---------------------------------------------AGTATAGGCTGGAGAGTTGTTGTAGGT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D N L H L G H V S S L L K I I M E V K D V G Y A
D N L H L G H V S S L L K I I M . V K D V - - A
GATAATCTACATTTAGGACATGTCTCAAGTCTTTTAAAAATAATAATG---GTTAAAGATGTT------GCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V R I L I D D L D Y S L K H N E N L L N K N R E
V R I L I D D L - - - - - - - - - - - N K N R E
GTGAGAATTCTTATAGATGATTTG---------------------------------AACAAAAATAGAGAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I K K I I I K I F K S Y N I K N V S F F L S S
A I K K I I I K I . . . . . . . . V S F F L S S
GCGATTAAGAAAATAATAATTAAGATT------------------------GTTAGTTTTTTTTTGTCTTCT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D L R N S E N Y V N D F Y K L I S V T T E D E A
D - - - - - - - - - - - - - - - - - - - - - - -
GAT---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A L C L E T S N D V K M G D L L Q P V L K T L D
- - - - - - - - - - - - - - - L Q P V L K T L D
---------------------------------------------TTACAACCCGTTCTTAAGACACTTGAT
145146147148149150151152153154155156157158159160161162163164165166167168
F L Y L D V D I I V H C N D K V V S L V E K S K
F L - - - - - I I V H C N D K V . S L V E K S K
TTTTTA---------------ATTATTGTTCATTGTAATGATAAAGTG---AGTTTAGTTGAAAAAAGTAAA
169170171172173174175176177178179180181182183184185186187188189190191192
Q F I N L D I K S I K Y I N N G L I C N F K N N
Q F I N L - - - - I K Y I N N - - - - - - K N N
CAATTTATTAATTTA------------ATTAAATATATTAATAAT------------------AAAAACAAT
193194195196197198199200201202203204205206207208209210211212213214215216
K I P D L D K T L S I W L F D K E R V V Y K K I
K I - - - - - - - - - - - - - - - - - - - - - -
AAGATA------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N K F F C E E G N T D T S V L K I F E S I I F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F V K L E N K H L N I T T V D G N I I T Y N N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E E L M S D F K N K L V H P A D L K T S C S N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297
I L E I F K K F S
- - - - - - - - -
---------------------------
Class I
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_val_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G A E P S S A P T F R P K I E E K R W S K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K E L L S K W S K E K L Y E F N P E R E G P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L I I D T P P P Y P S G K W H V G G A A H Y A Q
- I I D T P P . Y P S G K W H V G G A A H Y A Q
---ATCATAGATACGCCGCCT---TATCCTAGCGGCAAATGGCACGTAGGTGGTGCGGCACATTACGCACAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I D M I A R Y F R M K G W N V F V P W Y A D R N
I D M I A R Y - - - - - - - - F V P W Y A D R N
ATAGACATGATAGCACGCTAC------------------------TTTGTACCATGGTATGCCGATCGTAAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G L P V E V A V E K K Y K I V A H E M A K T K E
G - - - - - - - - - - - - - - - - - - - - - - -
GGC---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G R L K F L E L C S K E L D K I E E E L V R I W
- - - - - - - - - - - - - D K I E E E L V R I W
---------------------------------------GACAAAATAGAGGAAGAGCTGGTAAGAATATGG
145146147148149150151152153154155156157158159160161162163164165166167168
S R L G C S F T Y I Q N G T D S P E Y R R I T Q
S R L . . . . T - - Q N G T D S - - - - - - - -
TCCCGGCTT------------ACA------CAGAACGGGACAGATAGC------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A T F I E L W R R G L I Y E A E R P V N W C P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C R T T L S E A E I E H R E E D A Y L Y Y V K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K V K E T G E E I V I A T T R P E L I G A A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V Y N P E D E R Y K R L K G L H A I V P I Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y E V P I L E H P A A K P E F G T G L V M V S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y G D W T D V Q M L K D L G L E P K V I V N Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G T L N E K A G F L Q G L P I R E A R R R I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E L E K H G L I E K K E S L R H S V P I C W R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K T P V E I V H V R E Y F L K Q L E F K D K L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I A L K V H F R P E K H R R K L L D W I D S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K M D W P I S R T R Y Y G T E I P L W T C R R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G A K L V P E P G R Y Y R P W L E E P P W D K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P K C G A P R S E L E G E K R V F D T W F D S S
- - - - - - - - - - - - - - - - - D T W F D S S
---------------------------------------------------GACACATGGTTTGACTCTAGT
481482483484485486487488489490491492493494495496497498499500501502503504
I S V L Y A S G Y M R N P R L F E R A F P Q N E
I S V L - - - - - - - - - - - - - - - - - - - -
ATAAGCGTGCTA------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L P Y T M R P Q G L D I I R T W L Y F T M L R
- - - - - M R P Q G L D I I R T . L Y F T M L R
---------------ATGCGACCCCAGGGACTCGACATCATACGCACA---CTCTACTTCACTATGCTCCGG
529530531532533534535536537538539540541542543544545546547548549550551552
V Y Q L L G K P A F R W I R V T G M G L D P T G
V Y Q L - - - - - F . W I R V T - - - - - - - -
GTCTACCAGCTG---------------TTC---TGGATACGCGTAACA------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R T M H K S L G N V I D P E P Y I E T Y G A E P
- T M H K S - - - - - - - - - - - - - - - - - -
---ACTATGCACAAGAGC------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F R F W A A A A A R L G D D Y R F S E Q V L K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G K L F L T K L W N I S R F V S S F P R P A E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y K L R P I D L A F L G A L N E L I K R V D R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y G E E L D V H Q P I N E L Y N F T W N V F A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
H Y I E I V K T R A Y N R E G E F S E E E Q K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A W Y T L H A I L D A L L R M L A P I L P F I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D A L Y R R L Y G K S V H Q Q Q F P E P N P E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S T D Y A K M L D K I L S L N S A V W S W K R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H G Y K L S D K V E G Y K L Y V S K D L E P F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K D L S Y M H K I E I V V K E P P P G A E K L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827
D D V Y I A K A Q P S
- - - - - - - - - - -
---------------------------------
Class I
Archaea/Thermoplasma volcanium/amino acid sequences/Val_Arc_T_volcanium_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L D I D Q M E K K W L K Y W E D N D I Y T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I P S E R E K V F T I D T P P P T V S G K M H M
- - - - - - - - - T I D T P P . T V S G K M H M
---------------------------ACTATTGATACTCCACCA---ACTGTATCGGGTAAAATGCATATG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H S F S Y S H I D F I A R Y K R M R G Y H V F
G H S F S Y S H I D F I A R Y - - - - - - - - F
GGGCACTCTTTCTCCTACTCGCACATAGATTTCATAGCAAGATAC------------------------TTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F P W G F D D N G L A T E R Y V E K E T G I K P
F P W G F D D N G - - - - - - - - - - - - - - -
TTTCCATGGGGTTTTGACGATAACGGC---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T D G N V E H F I N L C R E F S Q A S E K A L I
- - - - - - - - - - - - - - - - Q A S E K A L I
------------------------------------------------CAGGCCAGTGAAAAGGCACTGATA
121122123124125126127128129130131132133134135136137138139140141142143144
E G W K R M G M S C Y F K D Y Y V T S S P E S V
E G W K R M . . . . Y - - D Y Y V T S S - - - -
GAAGGCTGGAAAAGAATG------------TAT------GACTATTATGTTACAAGTTCT------------
145146147148149150151152153154155156157158159160161162163164165166167168
K I S Q S M F L D L V K K N R V Y R D L A P T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R C P T C K T S I S Q I E M K D E M L K S K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y I N F D V E G S K L T I A T S R P E L L G S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V A L F V N N E D E R Y K N I I G R E A T V P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F G H K V P I M G D E S I D K D F G T G A E M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
C T F G D Q N D L D L W K K Y S L P L R I S I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D G K M N E N A G P L N G L S I N D G R K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I E L L K S E G F V V K E E D I K H S V N T H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R C G T P V E I F I E K Q W F I R Y L D L K K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I D S G R A V K W I P D Y M R T R Y E N W V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G L K W D W C I S R Q R Y Y G V P F P V W Y C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D C G N T V F A D D K D L P V D P R L Q P P S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R C D K C G S S N L V P E R D V M D T W A T S S
- - - - - - - - - - - - - - - - - D T W A T S S
---------------------------------------------------GATACATGGGCTACATCGTCA
457458459460461462463464465466467468469470471472473474475476477478479480
L T P R I A L S H F G L F D K Y Y P E D L R G Q
L T P R - - - - - - - - - - - - - - - - L R G Q
CTTACTCCCAGG------------------------------------------------CTGAGGGGGCAG
481482483484485486487488489490491492493494495496497498499500501502503504
G H D I I S F W A F T T I A R S K I H D N T I P
G H D I I S F . A F T T I A R S K I H - - - - -
GGCCATGATATCATATCGTTC---GCTTTTACAACAATAGCCAGGTCAAAGATCCAT---------------
505506507508509510511512513514515516517518519520521522523524525526527528
W L T L M I S G N V F D M Y G E K M S K S K G N
W . T L M I S - - - - - - - - - K M S K S - - -
TGG---ACTTTGATGATAAGC---------------------------AAAATGAGCAAGAGC---------
529530531532533534535536537538539540541542543544545546547548549550551552
I V D I Y A I T D K Y G A D A L R F W A S T V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q G E D I R V K E Q D F V R G R R T V I K M Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A N R L I D I L R N G R P L K N V D E P K H P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N L W I L T E E S K V V K L V T D S M D N Y E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S K A R S A L D V F F W N T F C D N Y L E M I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A I V Q A A N E K N D L G T V D E T I Y T A S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V M R D V V K M Y A P I M P F I T E E I Y Q S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E I E G K K K S V H I D C W P M E N R E Y V E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S E V R Y V T S I I D K I R A A K S N A K V S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
G T P V R K A L I K C N A S I A E K Y R D M L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790
R M M R I G S I D I E D S D K L E V S V E P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_val_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E M N K E Y D I N I E K E I Q K K W L E Q K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y K F D D D E K R P P Y I I D T P P P Y P T G R
- - - - - - - - - - - - I I D T P P . Y P T G R
------------------------------------TAATAAACCAAATTCAGA---AAATCCATCTTTTAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M H L G H A L N W T Y M D I I A R F K R M N N Y
M H L G H A L N W T Y M D I I A R F - - - - - -
TATTTTTTCAATGGTTTCATTGTCTGCATTTTTAACGAAATCCATAACTTTTTT------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D V L F P Q G W D C H G L P T E V K V E E I H G
- - L F P Q G W D C H G - - - - - - - - - - - -
------TATTTTTGATTTATTTGGTATGATTTCAGA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I T K T D I D R H E F R K L C I E L T D E N I E
- - - - - - - - - - - - - - - - - - - D E N I E
---------------------------------------------------------CTCATAATCATGGTT
121122123124125126127128129130131132133134135136137138139140141142143144
K M R E Q I N S L G I S I D W D R E Y I T M S P
K M R E Q I N S L . . . . D - - R E Y I T M S -
GTTGGTGTATATCTCAACGCGTTCCAA------------AGG------TTTATTAGATTTATATCTTCT---
145146147148149150151152153154155156157158159160161162163164165166167168
E Y V K K S Q T A F V K M H K D N L V Y R G K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P V N W C P R C Q T A I A F A E V E Y K D R K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y L N H I K F T Y A E D E N K Y L E I A T S R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E L L A A C V G I V V N P E D K R Y E D V V G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T V K V P L F N H E V K V Y P D K D V E M D F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T G V V M V C T F G D K T D V V W V N R H N L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V K E A I T E K G E L S E I C G K Y A G M T T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D A K K Q I I N D L K E E G Y L I K Q D P L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N V G V C W R C K T P I E I I V G D Q W F V N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K E L L D M V E K A T N E I K W T P E H M K T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L Q W I K D M G W D W C I S R Q R L F A T P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P V W Y C K D C G E V I V A K E E D L P I D P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K E C P Y T C K C G N K N L T P E T D V L D T W
- - - - - - - - - - - - - - - - - - - - - D T W
---------------------------------------------------------------ATCCAATAC
457458459460461462463464465466467468469470471472473474475476477478479480
M D S S I T P M A I T E W E T N N E F F N K R Y
M D S S I T P M - - - - - - - - - - - - - - - -
ATCTGTTTCAGGAGTTAAATTTTT------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P V Q L R P Q G H D I I R T W A F Y T I I K S I
- - - L R P Q G H D I I R T . A F Y T I I K S I
---------CTCCTTAGCTACAATTACTTCCCCACAATCTTT---ATACCATACTGGAATTGGTGTAGCAAA
505506507508509510511512513514515516517518519520521522523524525526527528
A L T D K K P W D E I V I N G M V F G E D G H K
A L - - - - - W . E I V I N - - - - - - - - - K
TAATCT---------------CCA---CCAACCCATGTCTTT---------------------------ATG
529530531532533534535536537538539540541542543544545546547548549550551552
M S K S R G N V V E P F E I T K D Y G A D A L R
M S K S - - - - - - - - - - - - - - - - - - - -
TTCAGGAGTCCA------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L W A S N S T I G N D V P F A W K E V D Y G Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F L R K F W N A S R F A K M N L D D E T I E T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K N S I N D S K I K L I V G G N D V E I S N P C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N C V N V D N P V D L W I L S K L N R L I E N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S N D L E N Y K F N T V G D I E K F V W H D L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D N Y I E M V K Y R L Y N K E D S E K A K I S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F N A Q Y T L Y T V I T T V L K L M A P F T P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
F S D I V G E I Y K I D D L H G S W C K V D K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S I S Q E N E N D G E I A K N T I V S I R R Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S N K G M P L N A P L E R V E I Y T N N H D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
G L L K V V E D I K G T L N I N E L K I I N G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
P E L E H K I S E I I P N K S K I G P E F K K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S K K V M D F V K N A D N E T I E K I L K D G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E S E F G L L T K E H V K D V K R A L F S G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906
I V E T V N I D G L I D S I A I I Q
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_val_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S Q D E I N K K L E E W P K H Y D P K G I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K W Q N L W M T K E F W E K V F R F R D E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K S P V F V I D T P P P F T S G E L H M G H A Y
- - - - - V I D T P P . F T S G E L H M G H A Y
---------------TATAGCTAACCTATTTTG---TTTAAGTGTCCTTATTGCTGAAGTTGCTTTTTTGAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W V T I S D T I G R F K R L E G Y N V L L P Q G
W V T I S D T I G R F - - - - - - - - L L P Q G
ATATTCTCCTAATTTCTGTGCTTCTCTATCATC------------------------GTTCTCTAGGGTTAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W D T Q G L P T E L K V Q Y K L K I P K E N R E
W D T Q G - - - - - - - - - - - - - - - - - - -
ACTCATCTTATCACC---------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L F L K K C I E W T E D M I R S M R T A M I R L
- - - - - - - - - - E D M I R S M R T A M I R L
------------------------------ATATATTGCTGACTCATCCTCCATAAATAACCTGTGTTTTAT
145146147148149150151152153154155156157158159160161162163164165166167168
G Y R A E W E R F E Y R T Y E S K Y R R I I Q K
. . . . E - - R . E Y R T Y E - - - - - - - - -
------------CTC------AAT---TTCCCAGAAATAAGAATA---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L I D M H K M G L V E M R E G P V Y W C P K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E T A L A Q S E V G Y K E E D G V L A Y I L F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F V D G E G G V T I A T T R P E L L G A T Q A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A V N P D D E R Y K S L V G R K V K I P I F D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I S I I A D K A V E M T F G T G A V M I S T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G D P Q D I R W Q L T Y R L P V Y E V V D D K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K I K N T N G L L D G L T V K E A R K K I I E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L K E K G Y L I K V E K I T H N V L A H T E R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D C L S P I E F L I K K Q I Y I K V L E W R N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L E D Y K K M K F T P Q R M S Y Y L E E W I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N L E W D W N I S R Q R V Y G T P I P F W Y C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N G H L I P A S E E V L P I D P S K V N P P I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K C P H C G L D L K P V K D V A D V W V D S S V
- - - - - - - - - - - - - - - - D V W V D S S V
------------------------------------------------CAGATAACCTTTTTCTTTTAATAT
481482483484485486487488489490491492493494495496497498499500501502503504
T V L Y L T G F Y D D K S R F T K T F P S S L R
T V L - - - - - - - - - - - - - - - - - - - L R
TTCAATAAT---------------------------------------------------------CTTTCC
505506507508509510511512513514515516517518519520521522523524525526527528
L Q G T D I I R T W L F Y T Y Y R T L A L A G N
L Q G T D I I R T . L F Y T Y Y R T L A L - - -
CTTATCATCTACGACTTCATAAACAGG---CCTATACGTTAATTGCCAACGGATATCCTGAGG---------
529530531532533534535536537538539540541542543544545546547548549550551552
I P F K E V L I N G Q V L G P D G T R M S K S K
- - F . E V L I N - - - - - - - - - R M S K S -
------TAT---TACAGCTCCAGTTCC---------------------------AATTATACTGATTTC---
553554555556557558559560561562563564565566567568569570571572573574575576
G N V V S P L D K V D E Y G A D A I R L T L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A K I G D D F P F K W D T V K S K K L L L Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
W N A G R L S Y P F I G K K K V N K P S K I H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I D K W I L Q E H K K F V Q Q S I E A Y R N Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F Y I V V E S I Y S Y F W E T I A D E Y L E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K H R L F M E D E S A I Y T L S R I I K D L L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L L Y P I A P H I T E E M Y E R L Y G D K M S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T L E N L P D I S D L E D D R E A Q K L G E Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K K A T S A I R T L K I Q N R L A I P T P I S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K I Y G P D D F I A K I K I I E E D L K K T L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814
L I D I I Y Q E N N E I K V E L L S D H G S
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_val_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A H R L P T R W D I K W E E E L L K L W E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G R F K T K I S G S R P V F V I D T P P P Y L S
- - - - - - - - - - - - - - V I D T P P . Y L S
------------------------------------------GTCATTGACACTCCTCCG---TACCTCTCA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S N R P H I G Q T A S Y A H F D M I A R F L R M
. N R P H I G Q T A S Y A H F D M I A R F - - -
---AACAGGCCGCATATAGGCCAAACCGCCTCCTACGCTCATTTCGACATGATAGCCAGGTTT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R G V D V I F P F Y L D R N G L P I E V Q V E K
- - - - - I F P F Y L D R N G - - - - - - - - -
---------------ATATTCCCGTTTTACCTTGACAGAAACGGC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K Y G V V A H E I P R E K F I K M C K E E L D S
- - - - - - - - - - - - - - - - - - - - - - D S
------------------------------------------------------------------GACAGC
121122123124125126127128129130131132133134135136137138139140141142143144
Y E G E F V S S L R R W G L S F D Y W P N G T D
Y E G E F V S S L R R W . . . . D - - P N G T D
TACGAGGGAGAGTTCGTCTCTTCGCTCAGGCGCTGG------------GAC------CCTAACGGCACGGAC
145146147148149150151152153154155156157158159160161162163164165166167168
S P E Y R R M T Q K T F I E L W H K G L V Y E A
S - - - - - - - - - - - - - - - - - - - - - - -
AGC---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E R P T P W C P R C R T A L A E P E I E Y R E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E T Y L N Y I K F K V K E T G E D I I I A T T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P E L L P A T V A V I F H P D D S R Y T R L N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
M H A V V P P E G Q V V P I L P H K A A N P N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G S G L V M I S T F G D T R D L M I V N E L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I R I I I D E G G R I K T G K Y A G V S I R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A R A K I I E D L K N A G L L V K Q E R L V H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V P V C W R C K T P L E I I V T R E L F I K Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E F K E K L I E L A G K M E F K P P E Y R Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D W I K S L E L D W P V S R R R Y Y A T E I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I W W C A K P N G E R V P L L P K G G E Y Y V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W R D E P P P E V K E A C K D G R L E G D T R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F D T W F D S S I S W M Y A S G V T K D F N A F
- D T W F D S S I S W M - - - - - - - - - - - -
---GACACGTGGTTTGATTCGTCTATTTCGTGGATG------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S K V Y P H S I M R P Q G Y D I I R T W L Y Y S
- - - - - - - - M R P Q G Y D I I R T . L Y Y S
------------------------ATGAGGCCTCAGGGTTACGACATTATAAGGACT---CTGTACTACTCC
505506507508509510511512513514515516517518519520521522523524525526527528
L L R A Y L L Y G D V P F R Y V R I N G M G L D
L L R A Y L L - - - - - F . Y V R I N - - - - -
CTCTTAAGGGCGTATTTGCTA---------------TTC---TACGTGAGAATTAAC---------------
529530531532533534535536537538539540541542543544545546547548549550551552
E K G E A M H K S K G N V I D L L A P V E K Y G
- - - - A M H K S - - - - - - - - - - - - - - -
------------GCCATGCATAAATCA---------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A D P V R F W A A A A G R L G T D Y R Y N E N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I R E G K E F L T K V W N I S R F V L S F P E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q Q K P Q L A P V D R A L L A R L Y D V A K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I T A Y S E F D V Y E P A H A L Y N F I W H E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A D H Y I E L V K S R A Y N R E G V F T E E E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R A A I W T L Y T A W R Y S L K L L A P I M P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V T D K I W R E A Y G R S I H D E M I E D P P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E W K E G D Q A L F H L V K K I N S A V W R Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N R R G M S L A D R L D A V L Y V S E L A M Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A K D L K Y M H K V S D V R P G R G A E Q I D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799
E G L V W L G
- - - - - - -
---------------------
Class I
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_val_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I D V N Q M E E K W I R Y W D E K D V Y R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P A D R D K V F A I D T P P P T V S G K M H M
- - - - - - - - - A I D T P P . T V S G K M H M
---------------------------ATCTTTTCTTCCTTTTAC---TGCTACCTTCACCCTGGTTCCAAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G H S F S Y P H I D F I A R Y K R M R G Y H V F
G H S F S Y P H I D F I A R Y - - - - - - - - F
GGACACCTTTGCTGCTGATTTTGCAGATCTTATCGCATCGATCAC------------------------ATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F P W G F D D N G L P T E R Y V E K E T G I K P
F P W G F D D N G - - - - - - - - - - - - - - -
GGCATCGCTGTATCTGCGCTTCTCATC---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S D S N V E E F I R L C K E I S E S S E K S L L
- - - - - - - - - - - - - - - - E S S E K S L L
------------------------------------------------CGCCTTTGCCACATCCAGCATGAC
121122123124125126127128129130131132133134135136137138139140141142143144
E G W K R I G M S C Y F K D Y Y V T S S P E S I
E G W K R I . . . . Y - - D Y Y V T S S - - - -
CTTTGAAGCCGTATAAAC------------CGT------GTCACCGGCTGCAGAAGCCTT------------
145146147148149150151152153154155156157158159160161162163164165166167168
R I S Q S M F L D L V R K G R V Y R D L A P S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R C P T C K T S I S Q I E M K D Q E M H T K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y I N F S V G D R P L T I A T T R P E M L G S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V A V F V N P D D A R Y R D L I G K E A T V P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F G N H V R I M A D A S V D M N F G T G A E M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
C T F G D Q N D L D L W K K Y N L P L K I S I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D G R M T E E A G P L K G L S I S D A R K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V E I L R E G G H V V K E E S I K H S V N T H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R C G T P I E I F I E K Q W F I K Y L D L K D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I E N G R K I E W T P E Y M R V R Y E N W V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G L K W D W L I S R Q R Y Y G V P F P V W Y C A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D C G N T V Y A D E S E L P V D P R I Q K P S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K C D R C G S T N L V P E R D V M D T W A T S S
- - - - - - - - - - - - - - - - - D T W A T S S
---------------------------------------------------CTCTATGGGTGTTCCGCACCT
457458459460461462463464465466467468469470471472473474475476477478479480
L T P R I A L T H F G L F D K Y Y P E D L R G Q
L T P R - - - - - - - - - - - - - - - - L R G Q
CTCATGGGTGTT------------------------------------------------GAGAATCTCTAC
481482483484485486487488489490491492493494495496497498499500501502503504
G H D I I S F W A F T T I A R S K I H D D R I P
G H D I I S F . A F T T I A R S K I H - - - - -
TATCTTCTTCCTCGCATCCGA---GCTCAGGCCTTTGAGCGGCCCAGCTTCCTCAGT---------------
505506507508509510511512513514515516517518519520521522523524525526527528
W F R I M I S G N V Y D M Y G E K M S K S K G N
W . R I M I S - - - - - - - - - K M S K S - - -
GTC---GCTGATCTTCAGTGG---------------------------GTCATTCTGGTCGCC---------
529530531532533534535536537538539540541542543544545546547548549550551552
I V D I Y S M I D K Y G A D A L R F W A S T V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q G D D I R I K D Q D F T R G R R T V I K M Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A K K L I D I L K G D R K I R L F E D V K H P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N R W I L T E D S R I M E T I T T H M D N Y E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S K A R T A L D T F F W N V F C D N Y L E M I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
P I I Q K A S A A G D Y D T V D E T V Y T A S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V M L D V A K A Y A P I M P F I A E E I Y Q T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
D F P G R K I S I H V D S W P D E K R R Y S D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N E E V S Y I V S V I D A I R S A K S A A K V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V G T R V K V A S V K G R K D L I E K Y R D L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791
S G M L R I D S M E I A D G D A V D A T V F P
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_val_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P K N Y D P N E I E P K W Q K Y W L E E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y K Y R L D E N K P S Y A I D T P P P F T S G T
- - - - - - - - - - - - A I D T P P . F T S G T
------------------------------------GCTATAGATACGCCACCA---TTCACGAGCGGTACC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L H L G H V L S H T W I D I I A R Y K R M R G Y
L H L G H V L S H T W I D I I A R Y - - - - - -
CTGCACCTCGGTCACGTGCTTAGTCATACCTGGATTGATATTATAGCTAGATAC------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N V L F P Q G F D N H G L P T E L K V E K E F G
- - L F P Q G F D N H G - - - - - - - - - - - -
------CTCTTTCCCCAGGGATTCGATAATCATGGA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I T K D Q P E E F L K K C V E W T W Q A I E A M
- - - - - - - - - - - - - - - - - W Q A I E A M
---------------------------------------------------TGGCAGGCTATAGAAGCAATG
121122123124125126127128129130131132133134135136137138139140141142143144
R K Q F I R I G Y S A D W D L E Y H T M D D W Y
R K Q F I R I . . . . D - - L E Y H T M D - - -
AGAAAGCAGTTTATAAGGATA------------GAC------CTTGAATATCACACGATGGAT---------
145146147148149150151152153154155156157158159160161162163164165166167168
K A A V Q R S L L E F Y K K G L I Y R E E H P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y W C P K C R T S L A K A E V G Y V E E E G Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y Y I K L P L A D G S G Y I P I A T T R P E L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P A C V A V F V H P D D E R Y K H L V G K K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L P I F E R E V P I L A D E D V D P N F G T G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V Y N C T Y G D E Q D I V W Q K R Y N L P V I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V I N E D G T M N E N A G P Y A G L K I E E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K K I A E D L E K M G L L Y K K E K I K H R V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R H T E R S S C M A P I E L L P K K Q W F I K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K D L I D E I I K V A K E I N W Y P E D M F L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L K D W A E S M D W D W V I S R Q R V F G T P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P F W V C K N G H I I P A R E E D L P V D P R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D K P P V D K C P V C G A E I E P V T D V L D C
- - - - - - - - - - - - - - - - - - - - - - D C
------------------------------------------------------------------GATTGC
457458459460461462463464465466467468469470471472473474475476477478479480
W V D S S I T P L I I T K W H E A I K G D E E A
W V D S S I T P L - - - - - - - - - - - - - - -
TGGGTTGATTCCAGTATAACTCCACTC---------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K W F E H N F P T A L R P Q G T D I I R T W A
- - - - - - - - - - - L R P Q G T D I I R T . A
---------------------------------CTTAGACCCCAGGGAACAGATATAATAAGGACT---GCC
505506507508509510511512513514515516517518519520521522523524525526527528
F Y T I L R T Y V L T G K K P W K D I V I N G M
F Y T I L R T Y V L - - - - - W . D I V I N - -
TTCTACACGATACTCAGAACTTACGTCTTA---------------TGG---GATATAGTGATAAAC------
529530531532533534535536537538539540541542543544545546547548549550551552
V A G P D G R K M S K S Y G N V V S P E E V I P
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------AAGATGAGCAAAAGC------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K Y G A D A L R L W T A L A P P G E D H P F K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E T V D Y N Y R F L Q K V W N I Y R F A E R H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K D F D Y E K Y R D V E L E P L D K W I L S R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
H R I I K F A T E E L E R Y R F N L I T R E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T F I W H E V A D D Y I E M I K Y R L Y G E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E S K L K A K V A L Y E L L Y N V M L L L A P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V P H I T E E I Y H A I F K E K I G E K S V H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L S W P E Y R E D R I D E E A E K I G E L A R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I V S E M R K Y K N S H G L P L N A K L K H V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I Y A L D S Y E R L K L I E R D I A G T M N I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R L E I V K G E P H L E E R I V E V K P N Y K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I G P K Y G K L V P R I V Q Y L R E N A E S I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R E I K E K G K A E F E V E G K K V E L T K E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
I T V R K E V F S E G E K V E T S V V D D V V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891
V F F
- - -
---------
Class I
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_val_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E L P D S Y D P D R I E P K W Q D E W E G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D V Y E Y D P S D A D T S Y I V D T P P P Y P T
- - - - - - - - - - - - - - I V D T P P . Y P T
------------------------------------------CTGCCCGTCGGACTCGAC---GACGGTGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G N L H L G H G L Q W S Y I D F V A R F R S L Q
G N L H L G H G L Q W S Y I D F V A R F - - - -
CCCGGAGTGGATCTGTGCCTGTATCTCCGCGGGGTCGGCGGCGTCGAGGGCCGCCATCAC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G D A V L F P Q G W D C H G L P T E V K V E E N
- - - - L F P Q G W D C H G - - - - - - - - - -
------------GGGGCCGATCTTCGAGTCCTCGCCGTCGAC------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H D I H R T D V S R E E F R E M C V E H T E E R
- - - - - - - - - - - - - - - - - - - - - E E R
---------------------------------------------------------------GTCGTCGCC
121122123124125126127128129130131132133134135136137138139140141142143144
I D G M K Q T M R E L G F S Q D W N A E Y R T M
I D G M K Q T M R E L . . . . D - - A E Y R T M
GTCGAAGTAGAGTTCGATGCGGTCGAGGTCGGC------------CCC------GGACTTCCACGCGCGGAT
145146147148149150151152153154155156157158159160161162163164165166167168
D P E Y W G K T Q E S F V R M A D D G M V Y R D
D - - - - - - - - - - - - - - - - - - - - - - -
CTC---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E H P V N W C P R C E T A I A D A E V E N V D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q G T L Y Y V T F D G V G N D D I E I A T T R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E L L A A C V G M A V S P D D E R Y E D R I G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T F E V P L F G Q E V E L V A D A D V D P E F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T G A V M I C T F G D K Q D V D W W A E Y D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R P V F T E D G H L N D L A G E F A G L D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A K D E I A D A L D D A G R L G D T E S T E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N V G A C W R C D T P I E I L S K E Q W F V E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D Q D L V L E K G A E V E W I P E H M H D R L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D W T E G M E W D W V I S R Q R V F A T P I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W Q C N D C G H W H I A S E A E T P V D P T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G P A L D D C P E C G A D E W T G E R D V M D T
- - - - - - - - - - - - - - - - - - - - - - D T
------------------------------------------------------------------GGTCTC
457458459460461462463464465466467468469470471472473474475476477478479480
W M D S S I T P L H I S G W P E E I D L D E F E
W M D S S I T P L - - - - - - - - - - - - - - -
CGCTTCGCTCGCGATGTGCCAGTGGCC---------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P V G L R P Q G H D I I R T W A F Y T L L R T G
- - - L R P Q G H D I I R T . A F Y T L L R T G
---------GATGACCCAGTCCCACTCCATGCCCTCCGTCCA---GACGAGGCGGTCGTGCATGTGCTCGGG
505506507508509510511512513514515516517518519520521522523524525526527528
A L T D E K P W D D A L I N G M V L D P D G K K
A L - - - - - W D . A L I N - - - - - - - - - K
AATCCA---------------CTTCTC---GACGAGGTCCTG---------------------------CGA
529530531532533534535536537538539540541542543544545546547548549550551552
M S K S S G D A V T P D E A I A E Y S A D A L R
M S K S - - - - - - - - - - - - - - - - - - - -
GAGAATCTCGAT------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q A L A L G G Q P G S D V Q F Q W K E V K S A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R F L T K L W N I V K F A E G H F D E D T P D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A D P A Y R D A D R W L L S E L T R V S E D V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S E M A D Y R F D A A L R R L R E F V W E D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D D Y V E L V K G R L Y N G R P G E R D A A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T I Y T A V T A V V R M L S P F S P H A A E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
W T S L P G T E G S V Y S A A W P D V D L L D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D A E V A G R R I A E T A S E I R A W K S E Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
M P L N A D L D R I E L Y F D G D D S H L D T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D L S E T V N A P I K L A S G R P D I E L V P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D V D G E D S K I G P E F R S D A G A V M A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
D A A D P A E I Q A Q I H S G D T V T V E S D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Q A F D L D S E W L T V D E E Y R A A S G E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
A V V E T S F G T V L V Y E
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_val_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E S E I P K E Y N A N E V E E K W M E K W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S M Y H F N W G E D P R P Q Y I I D T P P P Y
- - - - - - - - - - - - - - - - I I D T P P . Y
------------------------------------------------ATTATTGATACCCCACCT---TAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P T G N F H I G N A L N W C Y I D Y I A R Y K R
P T G N F H I G N A L N W C Y I D Y I A R Y - -
CCTACAGGCAATTTCCACATCGGAAACGCGCTCAACTGGTGTTACATCGACTATATAGCCAGATAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M R G Y N V M F P Q G W D C H G L P T E V K V E
- - - - - - M F P Q G W D C H G - - - - - - - -
------------------ATGTTCCCCCAGGGCTGGGACTGCCACGGC------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E I H G I T K N Q V P R A E F R K M C R E L T A
- - - - - - - - - - - - - - - - - - - - - - - A
---------------------------------------------------------------------GCA
121122123124125126127128129130131132133134135136137138139140141142143144
G N I E K M R K T M L R L G F S V D W S N E F V
G N I E K M R K T M L R L . . . . D - - N E F V
GGAAACATCGAAAAGATGCGCAAAACAATGCTGCGTCTG------------GAC------AACGAATTCGTT
145146147148149150151152153154155156157158159160161162163164165166167168
T M E P S Y F V K T Q K S F V R M Y N D G H I Y
T M E - - - - - - - - - - - - - - - - - - - - -
ACCATGGAG---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H E D H P V N W C P R C E T A I A F A E V E Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S R Q T K L N F V H F D K V D I A T T R P E L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A A C V A V A V N P K D E R Y S Q H I G K E I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V P I F G Q K V T L I A D E A V E P E F G T G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V M I C T F G D K Q D V R W W V K Y G L P L V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A L D K Q G R M T K A A G K Y E G M T L A E C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A V I A D L K A A G F L Y D Q K S L E Q N V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L C W R C D T P I E I L S E P Q W F V K I N H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G I L K A A D E I K W Y P E Y M K V R L Q N W T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G T M E W D W C I S R Q R I F A T P I P I W Y C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K K C G E V M I A E E S W L P I D P N E N T P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K A C A C G S T E F E P E T D V L D T W M D S S
- - - - - - - - - - - - - - - - - D T W M D S S
---------------------------------------------------GATACCTGGATGGACTCCTCG
457458459460461462463464465466467468469470471472473474475476477478479480
I T A L H V S G W E S E H E M R L P T Q I R P Q
I T A L - - - - - - - - - - - - - - - - I R P Q
ATTACTGCCCTC------------------------------------------------ATCCGTCCCCAG
481482483484485486487488489490491492493494495496497498499500501502503504
G H D I I R T W A F Y T I L R S L A L E G K R P
G H D I I R T . A F Y T I L R S L A L - - - - -
GGACATGACATCATCAGGACC---GCTTTCTATACAATCCTTAGGAGTCTGGCCCTT---------------
505506507508509510511512513514515516517518519520521522523524525526527528
W D S I V I N G M V L G P D G H K M S K S L G N
W . S I V I N - - - - - - - - - K M S K S - - -
TGG---TCCATAGTGATCAAC---------------------------AAGATGAGCAAGTCC---------
529530531532533534535536537538539540541542543544545546547548549550551552
V I S P E E V T T Q Y S A D A F R Q W G A V G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S T G S D V M F R W K D V V S A S R F L Q K M W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S I Y R F S M S H L K D F E P A D A E N F P P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A L L T I D R W L L S K L N K L V D T A T K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D G Y Q F D S T F K A I R G F A W E V L A D N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L E L V K G R L Y G E D P E G R K A A Q Y V L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T T T R T L S L L L A P F I P F F A E E M Y S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F S E E S V H T Q T W P A V N E K L I S E E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A A G E M I K E I T G E V R R Y K S D L G M A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N A P L K K I E I Y N A E I D T G D I A G A T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S E V E L M A G A P S F E Y V P V E V K P N M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F L G P R F R K E A G A V V K A L Q A E D P A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I E A Q A A S G K I T I T V N G E A V K L E P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A V E I R K E V I S G G R E V D V L D V K G A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869
V V I V R
- - - - -
---------------
Class I
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_val_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S R V L R E L P K T Y D Y R E V E A R W Q Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W K D E D V Y F K E G S E K P Q F V I D T P P P
- - - - - - - - - - - - - - - - - V I D T P P .
---------------------------------------------------GTCATTGATACGCCACCA---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y P T G E F H I G N A F N W C Y I D F L A R Y K
Y P T G E F H I G N A F N W C Y I D F L A R Y -
TACCCAACCGGGGAATTTCATATCGGAAATGCATTCAACTGGTGTTATATCGACTTTTTAGCCAGATAC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R M K G Y N V M F P Q G W D C H G L P T E V K V
- - - - - - - M F P Q G W D C H G - - - - - - -
---------------------ATGTTCCCGCAGGGGTGGGACTGCCATGGC---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E I H K I T K N D V D R Q K F R E M C R E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I G N I R K M R A S M R R M A F S I D W S H E Y
I G N I R K M R A S M R R M . . . . D - - H E Y
ATTGGCAATATCAGGAAGATGCGGGCATCCATGCGCAGGATG------------GAC------CACGAATAC
145146147148149150151152153154155156157158159160161162163164165166167168
I T M M P E Y F G K T Q L S F L R M Y H A G Q I
I T M M - - - - - - - - - - - - - - - - - - - -
ATCACCATGATG------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y Q S D H P V N F C P R C E T A I A F A E V N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S D R T T K L N Y F N F S G L E I A T S R P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L A A C V A V A V H P D D D R Y K D R K G E H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K V P L F G H E V P I I C D E A V D P S F G S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V M I C T F G D K Q D V I W W K V H N L P L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K A I D K T G H M T Q I A G K Y E G M D T T S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R E A I L A D M K S E G I L L R Q E P L E Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G T C W R C K T P I E I L S E H Q W F V R I P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E A A L K A A K E V K W Y P E H M F L R M E N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I S Q M E W D W C I S R Q R I F A S P I P V W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C K D C G E I I L P E E S E L P V D P T V D A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K R P C P K C G S S N Y I P E T D V L D T W M D
- - - - - - - - - - - - - - - - - - - D T W M D
---------------------------------------------------------GATACCTGGATGGAC
457458459460461462463464465466467468469470471472473474475476477478479480
S S I S V M H V T G W D G T Q K V P P L F P A Q
S S I S V M - - - - - - - - - - - - - - - - - -
TCTTCCATCTCGGTGATG------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I R P Q G H D I I R T W A F Y T I L R A V S L T
I R P Q G H D I I R T . A F Y T I L R A V S L -
ATTCGTCCACAGGGCCATGATATCATTCGGACT---GCATTTTACACGATACTTCGTGCAGTATCCCTC---
505506507508509510511512513514515516517518519520521522523524525526527528
G G K P W E Q I L V N G M V L G E D G F K M S K
- - - - W . Q I L V N - - - - - - - - - K M S K
------------TGG---CAGATCCTGGTAAAC---------------------------AAGATGAGTAAG
529530531532533534535536537538539540541542543544545546547548549550551552
S R G N V T V P E E I L E Q Y G A D S L R Q W A
S - - - - - - - - - - - - - - - - - - - - - - -
AGC---------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A L G A A T G S D I Q F N W N D V V A A N R F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T K M W N I S R F A L M Q L D R A Q Y K A D A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V T A L A D R W L L T K L S Q T V R D V S E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E T Y Q F D K A L K A I R E F A W D V L A D N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I E I V K G R L Y S D S D T R D G A C V A I R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S M D A I C R M L A P F T P Y F A E E V W S F M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E E S S V H Q Q P W V T F S Y E D E E A V R S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E I L V Q V I S E I R R Y K H D K G L A L N A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L G N V T V Y T T L A V D D A G D A S T A S N C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
T L T W K T G M P E L T Q V V S G V K F D M G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I G P K L R G K A K G F M Q A I E A L P K E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
T S V P A M I T V D G E E I A V P E G S V I P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L S Y T V A G A S V D L I P V S D S L V I T I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865
Q
-
---
Class I
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_val_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P Y N P K E I E Q W Y K E N Y K Y F F G E G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K I L I I D T P P P Y P A P L W H I G A A L S Y
- - - I I D T P P . Y P A P L W H I G A A L S Y
---------ATTATTGATACTCCCCCA---TACCCAGCACCATTATGGCATATAGGAGCGGCTTTAAGTTAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A L Q D F I A R G F R K L G Y K V I F P E G F D
A L Q D F I A R G - - - - - - - - I F P E G F D
GCTTTACAAGATTTTATTGCGAGGGGT------------------------ATATTTCCTGAAGGCTTTGAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G N G I P I E M Y L E K Y E K I P F G S I D R E
G N G - - - - - - - - - - - - - - - - - - - - -
GGGAATGGT---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E Y I K K C R Q I L D S W R E K M D K I L K D L
- - - - - - - - - - D S W R E K M D K I L K D L
------------------------------GATAGTTGGAGAGAAAAAATGGACAAAATCCTAAAAGATCTA
121122123124125126127128129130131132133134135136137138139140141142143144
L L S M D F E H R Y N T D D P E Y R A L T Q K T
. . . . D - - H R Y N T D D - - - - - - - - - -
------------GAT------CATAGATACAATACAGACGAT------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F A E L W E K G L I Y E A E Y P I N Y C P H C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T A I A D A E I E R K I K K T K L V Y I K F K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K D S D D Y I T V A T T R P E L L G A C K A I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V H P D D E R Y K K Y H N K I A I V P Y Y N R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I P I I P H K M A D P N F G T G A V M I C S Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D W V D V Q I F R E L Q L K P E K I I D E N G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L T I E P V K G L T T K E G R E K M I E V L K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L G V V E K I E E I E H S V P V H E R C E T E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E I I P M K E F Y L K Q L P F K E E I K K L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E I E F I P E R Y R K N L E N W I D S I T I D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P I S R R R W Y A T E I P L W Y C P K C G Y I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V A K D G K Y H Q P W K E E M V C P R C N T K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V G E T R V L D T W M D S S I T I Y Y L I K K Y
- - - - - - - D T W M D S S I T I Y - - - - - -
---------------------GATACTTGGATGGATTCCTCTATTACAATCTAT------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S K I L G I D E E G L F N N Y T L R P Q G Y E I
- - - - - - - - - - - - - - - - L R P Q G Y E I
------------------------------------------------TTAAGACCCCAAGGCTACGAAATA
481482483484485486487488489490491492493494495496497498499500501502503504
I R T W L Y Y T L L R V Y Q L T G K K A F D F V
I R T . L Y Y T L L R V Y Q L - - - - - F . F V
ATTAGGACT---CTATACTATACTTTATTAAGAGTATACCAACTA---------------TTC---TTTGTT
505506507508509510511512513514515516517518519520521522523524525526527528
V I N G M G L D K H G R K M S K R Y G N V I E P
V I N - - - - - - - - - K M S K R - - - - - - -
GTAATCAAT---------------------------AAAATGAGTAAAAGA---------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E T L L E K Y G A D T L R Y W F A M E I S I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D Y R I N E Q K I A G I M K F M N K V W N I A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y I S Q Y Q Y R E T Q N L K P T D E W I I N Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K Y L E N K A I E Y I R N F E F N K L A R E L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R F V W D V F A N H Y I E L T K K R A K N N D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S A I Y A L Y F V F E R V L N M L S I F S P G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A K Y L A K K L Y N K D I E K E K L K Y W G K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R L D L L Y K G E K L I E F N N Y V W K L K T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q G K K L K D P I S I E I P K E L E I F K E D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751
I L L H N I Q
- - - - - - -
---------------------
Class I
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_val_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A G E P L L K T E R V R K V Y D P Q E I E P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W Y A Y W E A N N F F R A E I R P D R T P F V I
- - - - - - - - - - - - - - - - - - - - - - V I
------------------------------------------------------------------TTCCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M M P P P N V T G R L H M G H A L Q D T I Q D A
M M P P . N V T G R L H M G H A L Q D T I Q D A
AAACCGTTCTTT---GGCGATTTCTTTTTCCAGCCGCGCCCGCTCCTGCTCCAGATCGATCACGTCGGCCAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L T R I R R M Q G Y E A L W L P G I D H A G I A
L T R I - - - - - - - - L W L P G I D H A G - -
CGGCACGTACAC------------------------CGCACTGGCCTTTGGCCGCTCCAGCCCCAT------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T Q N V V E R E L R D K E G K T R H D L G R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F L Q R V W R W K E E Y G D I I L Q Q K R R L G
- - - - - - - - - E E Y G D I I L Q Q K R R L .
---------------------------CCGGATCTCCCGGCCGGGCGGCACGCCGTAGGTGCTCCGCAC---
145146147148149150151152153154155156157158159160161162163164165166167168
D S C D W S R T R F T M D E G F T R A V Q E A F
D - - - - - R - R F T M D - - - - - - - - - - -
CCG---------------CTC---GATGCGGCCGAAGCG---------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I R L Y N E G L I Y R G D Y L V N W C P V D Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L S D E E V D N V E Q D G H L W Y I R Y P L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D G S G Y I T I A T T R P E T M L G D T A V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H P E D E R Y R H L I G K K V R L P L L G R E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P I I A D E H V K R D F G A G A L K I T P G H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K N D F E I G Q R H G L P I I N I M N P D G T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N E N G G P Y A G L D R F E A R K R I V E D L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A Q G L L E K V E P Y R H T V P I S S R S K A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I E P M L S R Q W F V R M R P L A E P A I E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R R G E I R F Y P E R W A N E Y F R W M E N I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D W C I S R Q I W W G H R I P V W Y Y T D E N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q I D E S K G F V V S I E Q P E P G M V Q D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V L D T W F S S W L W P F A T L G W P D Q T P D
- - D T W F S S W L W P F - - - - - - - - - - -
------CTTCGACTCGTCGATCTGGCCGTTTTCGTCCGT---------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L A Y F Y P T T V L V S G Y D I L F F W I A R M
- - - - - - - - V L V S G Y D I L F F . I A R M
------------------------GCGGATGTTTTCCATCCAGCGGAAGTACTCGTT---CCACCGCTCCGG
505506507508509510511512513514515516517518519520521522523524525526527528
I M A G I H F T G K I P F R D V F I T G M V K D
I M A G I H F - - - - - F . D V F I T - - - - -
ATAAAACCGGATCTCTCCCCG---------------GGC---CTCGGCCAGCGGCCT---------------
529530531532533534535536537538539540541542543544545546547548549550551552
K Y G R W M S K S L G N G I D P L E M I D Q Y G
- - - - W M S K S - - - - - - - - - - - - - - -
------------CATCGGCTCGATGAT---------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A D A V R Y S L T V L C T Q G Q D I K L D P S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F E M G R N F A N K I W N A F N V F G Q F M E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D D E G R P L R D Y R R Q R R F E E L S L V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
W M V T R L N Q T I A T V N E A I D R Y R L N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A L L T I Y D L F W G D Y C D W Y L E L I K P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R G Q A M D D E T I A L A V E L Y E K M I Q L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H P F M P F I T E A L W W R L R P R G E R E A C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I V S R W P E Q N P D E I D E T A L A R F G R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Q E M I S G I R N V R S T Y G V P P G R E I R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L I N V P E E E A E E V A H L E A H R D Y F A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L A R V S E L T V G M G L E R P K A S A T V V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G R Y E V Y V P L A D V I D L E Q E R A R L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E I A Q K E R F L E S V R K K L Q N P Q F L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A P A E V V A R E R Q K E Q D A R A E L E R L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895
A N L A A L S
- - - - - - -
---------------------
Class I
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_val_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E M P K D Y N I E I E K Q I Q K K W E E S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y K F D E E S N K P P Y I I D T P P P Y P T G R
- - - - - - - - - - - - I I D T P P . Y P T G R
------------------------------------ATTATAGATACACCACCA---TACCCAACTGGTAGA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L H L G H A L N W T Y M D I I A R Y K R M K G F
L H L G H A L N W T Y M D I I A R Y - - - - - -
TTACACTTAGGACATGCATTAAACTGGACTTACATGGATATAATAGCAAGATAC------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N V L F P Q G W D C H G L P T E V K V E E I H G
- - L F P Q G W D C H G - - - - - - - - - - - -
------CTCTTCCCGCAAGGTTGGGACTGTCATGGA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I T K S D V D R H K F R E L C I E L T K E N I E
- - - - - - - - - - - - - - - - - - - K E N I E
---------------------------------------------------------AAAGAAAACATTGAA
121122123124125126127128129130131132133134135136137138139140141142143144
K M R R Q I K S L G I S I D W D K E Y I T M T P
K M R R Q I K S L . . . . D - - K E Y I T M T -
AAAATGAGAAGACAGATAAAATCCTTA------------GAT------AAAGAGTATATAACAATGACT---
145146147148149150151152153154155156157158159160161162163164165166167168
E Y I K K S Q T A F V R M Y K D G L I Y R G K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P V N W C P R C Q T A I A F A E V E Y K E R E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K L N Y I K F P A A D G E G H L L I A T T R P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L M A A C V A I L V H P E D E R Y K H L I G K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F I V P L F G H K V K L L A D E D V E K E F G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G A V M V C T F G D K T D V L W V N R H K L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K K A I D E K G E L T E I A G K Y K G L K T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A R E K I I E D L K K E G Y L V K Q E P I K Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V G V C W R C K T P I E I I V T E Q W F V N V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K L I P K V R E V A D E I K W I P E H M K I R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N W I E D M D W D W V I S R Q R I F A T P I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V W Y C P K C G N V V V A K E E D L P I D P T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T G Y V C D K C G N K D L I P E T D V L D T W M
- - - - - - - - - - - - - - - - - - - - D T W M
------------------------------------------------------------GATACATGGATG
457458459460461462463464465466467468469470471472473474475476477478479480
D S S I T P M V I T K W L D D D K F F E K H Y P
D S S I T P M - - - - - - - - - - - - - - - - -
GACTCTTCAATAACACCAATG---------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V Q L R P Q G H D I I R T W A F Y T I V K S V A
- - L R P Q G H D I I R T . A F Y T I V K S V A
------TTAAGACCACAGGGGCATGACATAATTAGAACA---GCTTTCTATACAATTGTCAAGTCAGTAGCT
505506507508509510511512513514515516517518519520521522523524525526527528
L T G K K P W D E I V I N G M V F G E D G H K M
L - - - - - W . E I V I N - - - - - - - - - K M
TTG---------------TGG---GAGATTGTTATAAAC---------------------------AAGATG
529530531532533534535536537538539540541542543544545546547548549550551552
S K S R G N V V E P D E I I A K Y G A D A L R L
S K S - - - - - - - - - - - - - - - - - - - - -
AGTAAGAGT---------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
W A S N S V V G D D V Q F L W K E V D Y G Y R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L R K S W N A C R F A K M H I S D D I I D E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K P M E I S N P I D L W I L S K L Q R L I E R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D K D L E N Y R F N T I V E I Y K F V W H E F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D N Y I E M V K Y R L Y G D D E E A K K E A R W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T L Y Y V I D K V V R L L C P F A P H F S D Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A E I Y K I D N L H F S F P E V D N R F I N E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A E K F G E I A K N T V I S I R R F K A N S G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A L N A P L K Y V E I Y T E D E E T Y L A L N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
T A E D I K G T L K I E E L K I I K G K P A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S K I V E I I P D K S K I G P E F K K N A K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
M D L I K N A D E E T L E K I I N E G L E T E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G V I R K E H I K D V K R A L F C E G E E V D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
V D I E G V L A M A I I R K
- - - - - - - - - - - - - -
------------------------------------------
Class I
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_val_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G A K P S S G Q S F L P R I K E K R W S K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K E L L E K W S E E R L Y E F D P D R E G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L V I D T P P P Y P S G K W H V G G A A H Y A Q
- V I D T P P . Y P S G K W H V G G A A H Y A Q
---CAGGTCCTTGGCGAAGGG---CATCTCCTTGCTCAGGTATAGCTTGTAGCCCTCGACCTTCTGGGACAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I D M I A R Y F R M K G W N V F V P W Y A D R N
I D M I A R Y - - - - - - - - F V P W Y A D R N
CTTGTAGCCGTGGCTGCGCTT------------------------CTGGAGCACTTTGTCGAGCATCTTCGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G L P V E V T I E K K Y N I L A H E M A K T K E
G - - - - - - - - - - - - - - - - - - - - - - -
GTA---------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G R K K F L E L C S Q E L D R V E E E L V R I W
- - - - - - - - - - - - - D R V E E E L V R I W
---------------------------------------CATTCTCAGCAAGGCGTCCAGTATAGTGTGGAG
145146147148149150151152153154155156157158159160161162163164165166167168
R G L G C S F T Y I R N G T D S P E Y R R I T Q
R G L . . . . T - - R N G T D S - - - - - - - -
TGTGAACCA------------TTC------GCTGAACTCGCCCTCCCT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A T F I E L W R R G L I Y E D E R P V N W C P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C R T S L S E A E I E H R E E D S Y L Y Y V K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R V K E T G E E I L I A T T R P E L I G A A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V V Y N P E D E R Y K R L K G L H A I V P I Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y E V P I L E H P A A K P D F G T G L V M V S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y G D W T D V Q M I K D L G L E P K V I I N Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G T M N E K A G F L K G L P V R E A R R R M V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E L E K R G L I A K K E L I R H S V P V C W R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K T P V E I V H V R E Y F L K Q L E F Q D K L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I V K K M H F K P E K H R Q K L L D W I D S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K M D W P I S R T R Y Y G T E I P I W T C R R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G A K L V P E P G R Y Y R P W L E E P P W E R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P R C G A P R S E L E G E T R V F D T W F D S S
- - - - - - - - - - - - - - - - - D T W F D S S
---------------------------------------------------CTCGCGCACATGTACTATCTC
481482483484485486487488489490491492493494495496497498499500501502503504
I S V L Y A S G Y M R N L K L F E R V F S R D E
I S V L - - - - - - - - - - - - - - - - - - - -
GACGGGGGTTTT------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E L P Y T L R P Q G V D I I R T W L Y F S V L R
- - - - - L R P Q G V D I I R T . L Y F S V L R
---------------CACCATGCGGCGCCTGGCTTCGCGTACGGGCAG---TTTGAGGAACCCTGCCTTCTC
529530531532533534535536537538539540541542543544545546547548549550551552
V Y Q L L G K P A F R W V R V T G M G L D P K G
V Y Q L - - - - - F . W V R V T - - - - - - - -
GTTCATTGTGCC---------------CAC---GGGCTCCAGCCCGAG------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R A M H K S L G N V I D P E P Y I E A Y G A E P
- A M H K S - - - - - - - - - - - - - - - - - -
---GTCGCCATAGCTGCT------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F R F W A A A A A R L G D D Y R F S E Q T L K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G K L F L T K L W N I A R F V S S F P R P T D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y R L R P I D L V F L G A L N N L I R R V D H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y G E E L D V H Q P V N E L Y N F T W N I F A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
H Y L E L V K T R A Y N R E G E F S E E E Q R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A W F T L H T I L D A L L R M L A P I L P F I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D A L Y R R L Y G D S V H R Q K F P E P N P E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D T A Y A K M L D K V L Q L N S A L W T W K R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
H G Y K L S Q K V E G Y K L Y L S K E M E P F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
K D L E Y M H R I E T V V G E P P E T A E K L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E G A Y I A G L R G G T G A Q R G G M T G A E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843
L N R
- - -
---------
Class I
Bacteria/Escherichia coli/amino acid sequences/Ecoli_val_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K T Y N P Q D I E Q P L Y E H W E K Q G Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K P N G D E S Q E S F C I M I P P P N V T G S L
- - - - - - - - - - - C I M I P P . N V T G S L
---------------------------------GGCGACAAAGCCTTCGTT---CAGCTTGTTCTCAATACG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H M G H A F Q Q T I M D T M I R Y Q R M Q G K N
H M G H A F Q Q T I M D T M I R Y - - - - - - -
GCTGATTTCGCCTTCGATCTTCGCTACTTCTTTCGCCAGACGTGCCAGCTC---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T L W Q V G T D H A G I A T Q M V V E R K I A A
- L W Q V G T D H A G - - - - - - - - - - - - -
---CATCGGGATCAGCAGTTCTGCGCCGTCGAC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E G K T R H D Y G R E A F I D K I W E W K A E
- - - - - - - - - - - - - - - - - - - - - - A E
------------------------------------------------------------------TTCTGC
121122123124125126127128129130131132133134135136137138139140141142143144
S G G T I T R Q M R R L G N S V D W E R E R F T
S G G T I T R Q M R R L . . . . D - - R E R F T
ATCCGCGCTGCAACCACGCAGCAGCAGCTCCAGCGG------------GAT------TTCTGCACGGATGTT
145146147148149150151152153154155156157158159160161162163164165166167168
M D E G L S N A V K E V F V R L Y K E D L I Y R
M D - - - - - - - - - - - - - - - - - - - - - -
ACGTAC------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G K R L V N W D P K L R T A I S D L E V E N R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S K G S M W H I R Y P L A D G A K T A D G K D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L V V A T T R P E T L L G D T G V A V N P E D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R Y K D L I G K Y V I L P L V N R R I P I V G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H A D M E K G T G C V K I T P A H D F N D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V G K R H A L P M I N I L T F D G D I R E S A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V F D T K G N E S D I Y S S E I P A E F Q K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R F A A R K A V V A A V D A L G L L E E I K P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L T V P Y G D R G G V V I E P M L T D Q W Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R A D V L A K P A V E A V E N G D I Q F V P K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y E N M Y F S W M R D I Q D W C I S R Q L W W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
H R I P A W Y D E A G N V Y V G R N E D E V R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E N N L G A D V A L R Q D E D V L D T W F S S A
- - - - - - - - - - - - - - - - - D T W F S S A
---------------------------------------------------GGAGGAGAACCAGGTGTCGAG
481482483484485486487488489490491492493494495496497498499500501502503504
L W T F S T L G W P E N T D A L R Q F H P T S V
L W T F - - - - - - - - - - - - - - - - - - - V
AACGTCTTCATC---------------------------------------------------------GCG
505506507508509510511512513514515516517518519520521522523524525526527528
M V S G F D I I F F W I A R M I M M T M H F I K
M V S G F D I I F F . I A R M I M M T M H F - -
GCCAACATAAACATTACCCGCTTCGTCATA---TGCCGGGATACGGTGACCCCACCATAGCTGACG------
529530531532533534535536537538539540541542543544545546547548549550551552
D E N G K P Q V P F H T V Y M T G L I R D D E G
- - - - - - - - - F . T V Y M T - - - - - - - -
---------------------------GGA---ATACATGTTTTCGTA------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q K M S K S K G N V I D P L D M V D G I S L P E
- K M S K S - - - - - - - - - - - - - - - - - -
---GTTCTCAACCGCTTC------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L L E K R T G N M M Q P Q L A D K I R K R T E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q F P N G I E P H G T D A L R F T L A A L A S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G R D I N W D M K R L E G Y R N F C N K L W N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S R F V L M N T E G Q D C G F N G G E M T L S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A D R W I L A E F N Q T I K A Y R E A L D S F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F D I A A G I L Y E F T W N Q F C D W Y L E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K P V M N G G T E A E L R G T R H T L V T V L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
G L L R L A H P I I P F I T E T I W Q R V K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
C G I T A D T I M L Q P F P Q Y D A S Q V D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A L A D T E W L K Q A I V A V R N I R A E M N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A P G K P L E L L L R G C S A D A E R R V N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R G F L Q T L A R L E S I T V L P A D D K G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
S V T K I V D G A E L L I P M A G L I N K E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L A R L A K E V A K I E G E I S R I E N K L A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E G F V A R A P E A V I A K E R E K L E G Y A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951
A K A K L I E Q Q A V I A A L
- - - - - - - - - - - - - - -
---------------------------------------------
Class I
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_val_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y D K N L E K E Y Y Q I C E E R G Y F E I D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N K T I Q E K D K N F C I M M P P P N V T G V L
- - - - - - - - - - - C I M M P P . N V T G V L
---------------------------------GATGAATTTTTCATTTGA---CATGGAGTTAAGCTTGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H I G H A L T F T L Q D I M T R Y K R M D G Y K
H I G H A L T F T L Q D I M T R Y - - - - - - -
ACTTTCTTTTTCAAGCTTATTTTTTTGATTTTCAAGTCTTGTTAAAATACC---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L Y Q P G L D H A G I A T Q N V V E K Q L L T
- L Y Q P G L D H A G - - - - - - - - - - - - -
---AATAAAAATTTCTAAATTCTCGCTAACATC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q G I K K E E L G R E E F I E K V W E W K E Q S
- - - - - - - - - - - - - - - - - - - - - E Q S
---------------------------------------------------------------TTTATCGTT
121122123124125126127128129130131132133134135136137138139140141142143144
G G K I L D Q M R T L G I T P A W S R L R F T M
G G K I L D Q M R T L . . . . A - - R L R F T M
AAATTTGATATAAGCTTTTTCTATTTTAGAATT------------TAA------AGCACGGCGGATACTAAC
145146147148149150151152153154155156157158159160161162163164165166167168
D E G L V N A V K K A F V E L Y D K R L I V R G
D - - - - - - - - - - - - - - - - - - - - - - -
TAT---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N Y M I N W C T H D G A L S D I E V E Y K E N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G K L Y H I K Y F L K D S D E F L V V A T T R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E T F F G D T A V M V H P D D E R Y A K F V D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E V I L P I S K K A I K I I A D K H V E K E F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T G V V K V T P A H D M N D Y E V G L R H N L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F I S V F D E K G I L N E H C L E F Q G L E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A R E K I V A K L E S L G F I E K I E E Y N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q I G Y C Y R C N N I V E P Y I S K Q W F V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E I A Q E S I E K V A L G E S K F Y P N H W I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S F N A W M K D L R D W C I S R Q L W W G H Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P V Y Y C E C S H E W A S Q H T P K T C P K C Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S Q N F K Q D E D V L D T W F S S G L W A M S T
- - - - - - - - - - - D T W F S S G L W A M - -
---------------------------------ACAAGTTTTAGGCGTATGTTGGCTTGCCCATTC------
457458459460461462463464465466467468469470471472473474475476477478479480
L G W G N E N W G K D K I W S E K D L K D F Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N S L L I T G F D I L F F W V A R M M F Q S T N
- - L L I T G F D I L F F . V A R M M F Q S T N
------CCAAGCATTAAAGCTATTTATCCAGTGATTTGG---AAATTTACTTTCTCCAAGCGCAACTTTTTC
505506507508509510511512513514515516517518519520521522523524525526527528
V L H Q L P F K D I Y L H A L V K D E Q G R K M
V - - - - - F . D I Y L H - - - - - - - - - K M
TAT---------------TTC---TTTTACAAACCATTG---------------------------GTTGCA
529530531532533534535536537538539540541542543544545546547548549550551552
S K S L G N V I D P N E S I K E Y S A D I L R F
S K S - - - - - - - - - - - - - - - - - - - - -
ACGATAACA---------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T L A L L A I Q G R D I K L S N D K L L Q V R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F T N K I Y N A K N Y L L L N E S K F E D L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I T L H S E L A K Y I Y A K F Q T C V K D V R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N L D N Y R F N D A A N T L Y K F F W D D F C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
W G I E L S K A E K S S V K E L G S I F K E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
K L L N P F M P F I S E Y L Y H K L S D T E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T S P S I M I S K Y P K F K E Q D K N I E K I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S L L I E S I V S I R R A K S L I D L G N S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E K A Y I K F N D K K I K D E I K A Y M N F I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
M L A K C E Q I E F S E E K L P K A I C D V S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
N L E I F I T L E N V D L S G I L T R L E N Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
N K L E K E S F K L N S M L S N E K F I A N A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K E V V E Q N K E A L E N L K I Q L E K I S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870
L Q N L R G
- - - - - -
------------------
Class I
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_val_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D T T L A K S F E P Q T I E S Q W G P E W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K R G Y A T P A L D P S R P D F S I Q L P P P N
- - - - - - - - - - - - - - - - S I Q L P P . N
------------------------------------------------TCGATCCAGTTGCCGCCC---AAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V T G T L H M G H A F N Q T I M D G L V R Y H R
V T G T L H M G H A F N Q T I M D G L V R Y - -
GTGACGGGCACGCTGCACATGGGCCACGCGTTCAATCAGACGATCATGGACGGGCTCGTGCGCTAC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M L G H N T L W V P G T D H A G I A T Q I V V E
- - - - - - L W V P G T D H A G - - - - - - - -
------------------CTGTGGGTGCCCGGCACCGACCACGCGGGC------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Q L D A Q G V S R H D L G R E K F V E R V W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W K E Q S G S T I T G Q V R R I G A S P D W S R
- - E Q S G S T I T G Q V R R I . . . . D - - R
------GAGCAGTCCGGCTCGACGATCACGGGCCAGGTTCGCCGCATC------------GAT------CGC
145146147148149150151152153154155156157158159160161162163164165166167168
E Y F T M N D K M S E A V R E V F V R L Y E Q G
E Y F T M N - - - - - - - - - - - - - - - - - -
GAGTACTTCACGATGAAC------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I Y R G K R L V N W D P V L L T A V S D L E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V S E E E N G H L W H I R Y P L A D G S G H L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V A T T R P E T M L G D V A V M V H P E D E R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K H L V G Q R V K L P L C D R E I P I I A D D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V D R E F G T G V V K V T P A H D F N D Y Q V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q R H Q L A P I E I L T L D A K I N D N A P A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y R G L D R F D A R K A V V D E L D A Q G F L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S V K P H K L M V P R G D R T G V V I E P M L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D Q W F V A M T K P A P E G T F H P G K S I T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V S L D V V R R G Q I K F V P E N W T T T Y Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W L E N I Q D W C I S R Q L W W G H Q I P A W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G E N G E I F V A R S E E D A R A Q A A A K G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A G A L R R D D D V L D T W F S S A L V P F S S
- - - - - - - - - - - D T W F S S A L V P F - -
---------------------------------GACACGTGGTTCTCGTCGGCGCTCGTGCCGTTC------
481482483484485486487488489490491492493494495496497498499500501502503504
L G W P N E T P E M K H F L P S S V L V T G F D
- - - - - - - - - - - - - - - - - V L V T G F D
---------------------------------------------------GTGCTCGTCACCGGCTTCGAC
505506507508509510511512513514515516517518519520521522523524525526527528
I I F F W V A R M V M M T T H F T G K V P F E T
I I F F . V A R M V M M T T H F - - - - - F . T
ATCATCTTCTTC---GTCGCCCGGATGGTGATGATGACGACGCACTTC---------------TTC---ACC
529530531532533534535536537538539540541542543544545546547548549550551552
V Y V H G L V R D A E G Q K M S K S K G N T L D
V Y V H - - - - - - - - - K M S K S - - - - - -
GTGTACGTGCAC---------------------------AAGATGTCGAAGAGC------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P I D I V D G I G L D A L V A K R T T G L M N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K Q A A S I E K K T R K E F P D G I P A F G T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A L R F T M A S M A T L G R N V N F D L A R C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G Y R N F C N K L W N A T R F V L M N C E G H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
C G F D K P E V C G A G D C G P G G Y L D F S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A D R W I V S L M Q R V E A D I A K G F A D Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F D N I A N A I Y K F V W D E Y C D W Y L E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K V Q I Q N G T P E Q Q R A T R R T L L R V L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T V L R L A H P I I P F I T E A L W Q K V A P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A G R Y P A G K A E G E A S L M V Q A Y P V A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P K K L D E A S E Q W A A E L K A V V D A C R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L R G E M N L S P A T K V P L L A A G D A A K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R A F A P Y V Q A L A R L S E V R V L P D E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
L D A D A H G A P I A I V G D N K L V L K V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
D V A A E R E R L S K E I A R L E G E I A K C N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
A K L G N E A F V A K A P P A V V E Q E Q K R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955
A E F R N T L T K L G A Q L A R L P A
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_val_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T S A S Q L Q T Q Y S P A A T E V R W Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W E E T S A F Q A N S Q S S A E P Y C I V I P P
- - - - - - - - - - - - - - - - - - C I V I P P
------------------------------------------------------TGCATTGTAATTCCGCCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P N V T G S L H M G H A F E A S L I D V L I R F
. N V T G S L H M G H A F E A S L I D V L I R F
---AATGTGACAGGGAGCCTGCACATGGGCCATGCTTTTGAAGCCTCGCTGATTGATGTTTTAATTCGTTTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q R M R G K N A L W L P G T D H A S I A V Q T I
- - - - - - - - L W L P G T D H A S - - - - - -
------------------------TTATGGCTACCTGGAACTGACCACGCCAGT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L D R Q L R E E G L S R Y D L G R E K F L E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W Q W K A E S G G T I V G Q L R R L G V S V D W
- - - - A E S G G T I V G Q L R R L . . . . D -
------------GCTGAATCAGGTGGAACGATTGTTGGTCAACTGCGGCGTTTA------------GAC---
145146147148149150151152153154155156157158159160161162163164165166167168
S R E R F T M D E G L S K A V L E A F I Q L Y E
- R E R F T M D - - - - - - - - - - - - - - - -
---CGTGAACGCTTCACGATGGAT------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G L I Y R G Q Y L V N W C P A S Q S A V S D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V E M K E V D G S L W Y F R Y P L T D G S G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L E V A T T R P E T M L G D T A V A V N P Q D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R Y Q H L I G K T I T L P L V Q R E I P I I A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P W V E A E F G T G C V K V T P A H D P N D F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M G Q R H Q L P L I T V M N K D G T M N E N A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q F E G L D R F E A R K A V V A A L E E A G F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K V E D Y R H S I P I S D R G K V P V E P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S T Q W F V K I E P L A Q R A L E A L N G E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P R F V P E R W T K V Y R D W L E N L R D W C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S R Q L W W G H Q I P A W Y A V S E T N G V V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D S T P F V V A K S A E E A Q Q Q A I A Q F G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D V V L Q Q D E D V L D T W F S S G L W P F S T
- - - - - - - - - - - D T W F S S G L W P F - -
---------------------------------GATACCTGGTTCTCATCTGGTTTATGGCCATTT------
481482483484485486487488489490491492493494495496497498499500501502503504
L G W P N Q T E D L E T F Y P T S T L V T G F D
- - - - - - - - - - - - - - - - - T L V T G F D
---------------------------------------------------ACCTTAGTCACGGGTTTCGAC
505506507508509510511512513514515516517518519520521522523524525526527528
I I F F W V A R M T M M A G H F T G K M P F K D
I I F F . V A R M T M M A G H F - - - - - F . D
ATCATCTTTTTC---GTGGCTCGGATGACGATGATGGCGGGTCACTTC---------------TTT---GAT
529530531532533534535536537538539540541542543544545546547548549550551552
V Y I H G L V R D E N N K K M S K S A G N G I D
V Y I H - - - - - - - - - K M S K S - - - - - -
GTCTATATCCAC---------------------------AAGATGTCAAAATCA------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P L I L I D R Y G T D A L R Y A L I R E V V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G Q D I R L D Y N R K T D E S A T V E T S R N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A N K V W N A S R F V M L N L D D K T P E Q L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
M A A T A D L E L A D R W I L S R Y H A T T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L I N Q I E A Y D L G A A A K Q L Y E F I W G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F C D W Y I E L V K P R L Y G E D A Q S R L V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Q Q T L A Q I L E G I L R L L H P F M P H V T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E I W H T L N Q V G E D Q F L A L Q S F P Q P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S E W I Q P E L D R E F Q L M I D V I R T L R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L R A E A G L K P G Q K I T A I L Q S D S E S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R C N L E Q S Q A Y I R D L T K T E M L T I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S L T E E P Q A L V G V T A T V Q V L L P L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L V D L A A L Q T K L S R N L E K V E K E I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
L S G R L N S S N F V D K A P A E V V A E T R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909
N L L E A E K Q A E L L R D R L T R L Q A
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_val_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L P K A Y D P K S V E P K W A E K W A K N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F V A N P K S G K P P F V I F M P P P N V T G S
- - - - - - - - - - - - V I F M P P . N V T G S
------------------------------------GCCGGGGGAGGCGAGCTT---CTGGCTCCGCTCCGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L H M G H A L D N S L Q D A L I R Y K R M R G F
L H M G H A L D N S L Q D A L I R Y - - - - - -
CAGGGCCAAAAGCTCCTTGAGCCGCTTCTCCTGGCGGCGCCGCCACTCCTCCAC------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A V W L P G T D H A G I A T Q V V V E R L L L
- - V W L P G T D H A G - - - - - - - - - - - -
------GCGGGCCGTCACCCGGGGCATGGCCTTGAC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K E G K T R H D L G R E K F L E R V W Q W K E E
- - - - - - - - - - - - - - - - - - - - - - E E
------------------------------------------------------------------CCGCAC
121122123124125126127128129130131132133134135136137138139140141142143144
S G G T I L K Q L K R L G A S A D W S R E A F T
S G G T I L K Q L K R L . . . . D - - R E A F T
CTCCTGGGCCGGGGGGAGCCCGGCCTCGGCCTTCAG------------CGT------CTGCTTCAGGGCCTC
145146147148149150151152153154155156157158159160161162163164165166167168
M D E K R S R A V R Y A F S R Y Y H E G L A Y R
M D - - - - - - - - - - - - - - - - - - - - - -
AAAGGC------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A P R L V N W C P R C E T T L S D L E V E T E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T P G K L Y T L R Y E V E G G G F I E I A T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P E T V F A D Q A I A V H P E D E R Y R H L L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K R A R I P L T E V W I P I L A D P A V E K D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G T G A L K V T P A H D P L D Y E I G E R H G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K P V S V I N L E G R M E G E R V P E A L R G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D R F E A R R K A V E L F R E A G H L V K E E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y T I A L A T C S R C G T P I E Y A I F P Q W W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L R M R P L A E E V L K G L R R G D I A F V P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R W K K V N M D W L E N V K D W N I S R Q L W W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G H Q I P A W Y C E D C Q A V N V P R P E R Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E D P T S C E A C G S P R L K R D E D V F D T W
- - - - - - - - - - - - - - - - - - - - - D T W
---------------------------------------------------------------GTGCCCCCA
457458459460461462463464465466467468469470471472473474475476477478479480
F S S A L W P L S T L G W P E E T E D L K A F Y
F S S A L W P L - - - - - - - - - - - - - - - -
CCAGAGCTGGCGGGAGATGTTCCA------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P G D V L V T G Y D I L F L W V S R M E V S G Y
- - - V L V T G Y D I L F L . V S R M E V S G Y
---------GGCGATGTCCCCCCGCCTTAGGCCCTTTAGGAC---CTCCGCAAGGGGCCTCATCCTGAGCCA
505506507508509510511512513514515516517518519520521522523524525526527528
H F M G E R P F K T V L L H G L V L D E K G Q K
H F - - - - - F . T V L L H - - - - - - - - - K
CCACTG---------------CTC---GGGGGTGCCGCAGCG---------------------------GTC
529530531532533534535536537538539540541542543544545546547548549550551552
M S K S K G N V I D P L E M V E R Y G A D A L R
M S K S - - - - - - - - - - - - - - - - - - - -
CTCCTCCTTCAC------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F A L I Y L A T G G Q D I R L D L R W L E M A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N F A N K L Y N A A R F V L L S R E G F Q A K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D T P T L A D R F M R S R L S R G V E E I T A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y E A L D L A Q A A R E V Y E L V W S E F C D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y L E A A K P A L K A G N A H T L R T L E E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A V L L K L L H P M M P F L T S E L Y Q A L T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K E E L A L E A W P E P G G R D E E A E R A F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A L K Q A V T A V R A L K A E A G L P P A Q E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R V Y L E G E T A P V E E N L E V F R F L S R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D L L P E R P A K A L V K A M P R V T A R M P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E G L L D V E E W R R R Q E K R L K E L L A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E R S Q R K L A S P G F R E K A P K E V V E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862
E A R L K E N L E Q A E R I R E A L S Q I G
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class I
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_val_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E L S T R Y N P A E I E T K W Y R Y W E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G Y F T P K G V G E K F S I V I P P P N I T G R
- - - - - - - - - - - - S I V I P P . N I T G R
------------------------------------GTCTTTGTTTGCGAGTTT---CTCCAGACGATCTAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I H M G H A L N I T L Q D I V V R Y K R M K G Y
I H M G H A L N I T L Q D I V V R Y - - - - - -
TTCTTTCTGGATCTTCTCCATGATCTGTTTCAATCTCTCTTTTTCCTTTTCGAA------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D V L W V P G E D H A G I A T Q N A V E K F L L
- - L W V P G E D H A G - - - - - - - - - - - -
------ATAGGCCTCTATTTCCTCTTCAACGTAGGC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q T Q G K T R E E I G R E K F L E I T W E W A N
- - - - - - - - - - - - - - - - - - - - - - - N
---------------------------------------------------------------------GTA
121122123124125126127128129130131132133134135136137138139140141142143144
K Y R R E I R E Q I K A L G A S V D W T R E R F
K Y R R E I R E Q I K A L . . . . D - - R E R F
CACCTTCACTCTCTGAGACTGCGGCAGATTCATCTCGGC------------GAC------CACCATGTTCAT
145146147148149150151152153154155156157158159160161162163164165166167168
T L D E G L S R A V R K V F V E L Y R K G L I Y
T L D - - - - - - - - - - - - - - - - - - - - -
GAGCCTGGT---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R G K Y I V N W C P R C K T V L S D E E V E H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E H K S K L Y Y V K Y P V K D S D E Y I V V A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R P E T M L G D T A V A V H P E D E R Y K N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V G K T L I L P L V G R E I P V V A D K Y V D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K F G T G A V K V T P A H D P N D Y L I A Q R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N L P M I E I F D D N A R I N E N G G K Y K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D R Y E A R E K I V K D L E E Q G F L V K I E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y T H S V G H C Y R C D T V I E P K L S D Q W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V S T K P L A K R A I E A V E N G E I R F F P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R W T K V Y L N W M Y E I R D W C I S R Q L W W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G H R I P V W Y C Q D C G H L N V S E E D V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C E K C G S T N L K Q D E D V L D T W F S S A L
- - - - - - - - - - - - - - - - D T W F S S A L
------------------------------------------------CTGACAGTACCAGACGGGAATCCT
457458459460461462463464465466467468469470471472473474475476477478479480
W P F S T L G W P E E T E D L K R Y Y P T D L L
W P F - - - - - - - - - - - - - - - - - - - L L
GTGGCCCCA---------------------------------------------------------CTTCGT
481482483484485486487488489490491492493494495496497498499500501502503504
V T G F D I I F F W V A R M I M M G Y E F M N D
V T G F D I I F F . V A R M I M M G Y E F - - -
CCATCTCTCCGGGAAGAACCTTATCTC---ATTTTCTACGGCCTCAATAGCTCTTTTGGCAAG---------
505506507508509510511512513514515516517518519520521522523524525526527528
K P F S H V Y I H Q L V R D K Y G R K M S K S L
- - F . H V Y I H - - - - - - - - - K M S K S -
------GAA---CTGGTCGGAAAGCTT---------------------------GCAGTGCCCAACAGA---
529530531532533534535536537538539540541542543544545546547548549550551552
G N G I D P L E V I D E Y G A D P M R F T L A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L A A Q G R D I K L D P R Y F D A Y K K F A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I W N A T R F V L M N L E D Y K E V P L E N L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T V D K W I L T R L N K T V E E V T N A L E N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D F N I A A R T I Y N F F W D D F C D W Y I E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S K P R L K T E E R N L V Q T V L V K V L D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L R L L H P F M P F L T E E L W Q K L P V A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S I T I A K W P E I E R E L I D E T A E K E F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R L M N M V R G V R N V R A E M N L P Q S Q R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K V Y I K G Y E V T E E E E L L L K T L G N I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E V S F V N E K P P K T A T A Y V E E E I E A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V D L G G L I D F E K E K E R L K Q I M E K I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K E I D R L E K K L A N K D F V E K A P E E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E E T K E K L N T N R E R L A R L E S I L R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865
E
-
---
Class I
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_val_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T A T I P N L P S L Y D P F T T E A K W Q K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W E D N Q V Y K A D P Q R G G E P Y C I V I P P
- - - - - - - - - - - - - - - - - - C I V I P P
------------------------------------------------------TGCATCGTCATTCCTCCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P N V T G S L H M G H A F D N T L I D S L I R Y
. N V T G S L H M G H A F D N T L I D S L I R Y
---AACGTGACTGGTAGCCTCCACATGGGTCACGCCTTCGATAACACGCTGATAGATTCCCTGATCCGCTAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H R M K G Y N A L Y L P G T D H A S I A V H T I
- - - - - - - - L Y L P G T D H A S - - - - - -
------------------------CTATATCTCCCTGGAACCGACCACGCCAGT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E K Q L Q A E G K T R Y E L G R E K F L E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W Q W K D S S K G T I V G Q L R R L G V S V D W
- - - - D S S K G T I V G Q L R R L . . . . D -
------------GACTCATCTAAGGGTACAATTGTCGGTCAACTGCGCCGCTTG------------GAT---
145146147148149150151152153154155156157158159160161162163164165166167168
S R E R F T M D E G L N K A V I E E F V R F H E
- R E R F T M D - - - - - - - - - - - - - - - -
---CGGGAACGCTTCACGATGGAT------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G L I Y R S K Y L V N W C P A T Q S A V S D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V E N K E V N G H L W H F R Y P L T D G S G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V E L A T T R P E T M L G D T A V A V N P N D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R Y K H L I G K T L T L P I M Q R E I P V I G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E F V D P E F G T G C V K V T P A H D P N D F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M G Q R H D L P F I N I M N K D G T L N E N A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D F Q G Q D R F V A R K N V V K R L E A D G F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K V E E Y K H A V P Y S D R G K V P I E P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S T Q W F V K I R P L A D R T L S F L D E Q N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P Q F V P Q R W T K V Y R D W L V K L R D W C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S R Q L W W G H Q I P A W Y A V S E T G G E I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D N T P F V V A R S E A E A R E K A N A Q F G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D V K L E Q D P D V L D T W F S S G L W P F S T
- - - - - - - - - - - D T W F S S G L W P F - -
---------------------------------GATACGTGGTTTTCTTCGGGATTATGGCCCTTT------
481482483484485486487488489490491492493494495496497498499500501502503504
L G W P D R T E D L E F Y Y P T A T L V T G F D
- - - - - - - - - - - - - - - - - T L V T G F D
---------------------------------------------------ACCCTAGTCACGGGATTTGAC
505506507508509510511512513514515516517518519520521522523524525526527528
I I F F W V A R M T M L G G H F T G Q M P F K D
I I F F . V A R M T M L G G H F - - - - - F . D
ATTATCTTCTTT---GTGGCAAGAATGACCATGCTAGGGGGGCATTTT---------------TTC---GAT
529530531532533534535536537538539540541542543544545546547548549550551552
V Y I H G L V L D E N G K K M S K S A G N G I D
V Y I H - - - - - - - - - K M S K S - - - - - -
GTTTACATCCAC---------------------------AAAATGTCCAAGTCA------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P L L L M D K Y G T D A L R Y T L V K E V V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G Q D I R L D Y N R Q K D E S A S V E A S R N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A N K L W N A A R F V M M N L D G K T P Q Q L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
V E A L H A T S L Q L S D R W I L S R Y H Q V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K Q S T D Y I D N Y G L G E A A K G L Y E F I W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G D F C D W Y I E L V K S R L F Q K D A E G A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S R L V A Q Q T L A Y V L E G I L K L L H P F M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
P H I T E E I W H T L T Q S E E G Q S I S V Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y P E S D A T L I D S E L E Q Q F E L L I E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
R T L R N L R A E A G I K P G V K V K A V M Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E S D R E R Q I L T S S E L Y I Q D L A K V E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L T I T S A L E T A L E P A I A D V V G T V Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L I P L A G V V D V A V L K A K L E K S L S K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
Q A E A K S L S A R L S N P T F V D K A P A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V Q G A K D A L A E A E K Q I E I L Q A R L R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914
L K
- -
------
Class I
Bacteria/Mycobacterium smegmatis/amino acid sequences/Msmegmatis_val_aa
Bacteria/Mycobacterium smegmatis/nucleotide sequences/Msmegmatis_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T A S P E N R A D A L P K S W D P G A V E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L Y Q G W V D A G Y F T A D P A S D K P P Y S I
- - - - - - - - - - - - - - - - - - - - - - S I
------------------------------------------------------------------GCGCCG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L P P P N V T G S L H M G H A L D H T L M D V
V L P P . N V T G S L H M G H A L D H T L M D V
TTCGGCCTCGAC---GACAGTGCCCGACGTGTCGACCTCGACCACGACGGTGCCCTGCGACAGGCGCACCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L T R R K R M Q G Y E V L W L P G M D H A G I A
L T R R - - - - - - - - L W L P G M D H A G - -
GACCGACGCCGA------------------------GGTGAGCCACGCGAGCGCGGCGACGGCGGG------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T Q T V V E K Q L A A D G K T K E D L G R E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V A K V W D W K R E S G G T I G G Q M R R L G D
- - - - - - - - R E S G G T I G G Q M R R L . D
------------------------GATGAGCTTCTGCATATCGGTGATGCGTTGTGTCGCAACGGT---CGG
145146147148149150151152153154155156157158159160161162163164165166167168
G V D W S R D R F T M D E G L S R A V R T I F K
- - - - - R D R F T M D - - - - - - - - - - - -
---------------CTCGGGCCACGTCGCGACCAC------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R L F D A G L I Y Q A E R L V N W S P V L E T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I S D L E V K Y E D V E G E L V S F R Y G S M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D D E P H I V V A T T R V E T M L G D T A I A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H P D D E R Y R H L V G K T L P H P F V D R D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V I V A D T H V D P E F G T G A V K V T P A H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P N D F E I G M R H G L P M P T I M D T K G R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A D T G T Q F D G M D R F E A R V K V R E A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A Q G R I V A E K R P Y L H S V G H S E R S G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P I E P R L S L Q W W V K V E S L A K A A G D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V R N G D T V I H P P S L E P R W F A W V D N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
H D W C I S R Q L W W G H R I P I W H G P D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T V C V G P D E T P P E G W E Q D P D V L D T W
- - - - - - - - - - - - - - - - - - - - - D T W
---------------------------------------------------------------TCCCCACCA
457458459460461462463464465466467468469470471472473474475476477478479480
F S S A L W P F S T M G W P D H T P E L A K F Y
F S S A L W P F - - - - - - - - - - - - - - - -
CAACTGCCGCGAGATGCACCAATC------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P T S V L V T G Y D I L F F W V A R M M M F G T
- - - V L V T G Y D I L F F . V A R M M M F G T
---------GGTGTCGCCGTTGCGCACCGCGTCACCCGCGGC---GGCGAGCGACTCGACCTTGACCCACCA
505506507508509510511512513514515516517518519520521522523524525526527528
F V G D D P A V T L E G A R G R Q V P F E N V F
F V - - - - - - - - - - - - - - - - - F . N V F
CTGCAG---------------------------------------------------GTG---GTACGGGCG
529530531532533534535536537538539540541542543544545546547548549550551552
L H G L I R D E F G R K M S K S R G N G I D P L
L H - - - - - - - - - K M S K S - - - - - - - -
CTTCTC---------------------------CGCCTCGCGCACCTT------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D W V E K F G A D A L R F T L A R G A S P G G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L S I G E D H A R A S R N F A T K L F N A T R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A L M N G A A P A P L P A A S E L T D A D R W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L G R L E E V R A E V D S A F D N Y E F N R A C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E A L Y H F A W D E F C D W Y V E L A K V Q L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Q E E V H T A R T T A V L A A V L D T L L K L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H P V M P F V T E T L W K T L T G G E S V V V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T W P E P S G F A P D T V A T Q R I T D M Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I T E V R R F R S D Q G L A D R Q K V P A R L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D V E A A G L T A Q L P A V A A L A W L T E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D G F S P S A S V E V R L S Q G T V V V E V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S G T V D V E A E R R R L E K D L G G R P E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G H H H G Q T R Q R G L P V Q G A R P G G R Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872
P G Q A S P G Q
- - - - - - - -
------------------------
Class I
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_val_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K I Y N H K I V E K D K N E K W I K K E Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S T H D L T K K P F S I L L P P P N V T G K L H
- - - - - - - - - - S I L L P P . N V T G K L H
------------------------------TCTATCTTGTTACCTCCT---AATGTAACAGGAAAATTACAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I G H A W N T T L Q D F L I R L K R L Q G Y D V
I G H A W N T T L Q D F L I R L - - - - - - - -
ATTGGGCATGCTTGAAATACAACTCTTCAAGATTTTTTAATTAGATTA------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L W L P G T D H A G I A T Q A K V E K R L L D Q
L W L P G T D H A G - - - - - - - - - - - - - -
TTGTGATTACCAGGAACTGATCATGCAGGT------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I F K S D L T K E E L F E K A M D W K N E Y A
- - - - - - - - - - - - - - - - - - - - N E Y A
------------------------------------------------------------AATGAATATGCA
121122123124125126127128129130131132133134135136137138139140141142143144
N E I K K Q W S K L G L A L D Y K K E R F T L D
N E I K K Q W S K L . . . . D - - K E R F T L D
AACGAAATAAAAAAACAATGGTCAAAATTA------------GAT------AAAGAAAGATTTACATTAGAT
145146147148149150151152153154155156157158159160161162163164165166167168
E L S N K A V N D I F V M L Y K D G Y I Y R G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R A I Y Y D T F L Q T S L S N I E V I N V E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S K M Y Y L K Y F L E N S N S E Y V L V A T T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P E T L A S D V A L I I N P N D K K N S H Y L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K N F V N P L T K K I I K M H S D D Y A I M N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G S G I V K I S A H D M N D F D V I K R L N L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V I E T I D K F G K M T N A I P E F E N M S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A R E N I V L K L K K E N L I D K I E N I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N I I M S E R S N T V A E V L V M P Q W F I K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E P F S K M I L K K I Q N E N E D D K K V L F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P K K F E N I L K I W M Q E A H D W N I S R Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W W G H K I P A W Y D E K G N I K V Q T T S P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S N W T Q D Q D V L D T W F S S G I A P F S F L
- - - - - - - - - - D T W F S S G I A P F - - -
------------------------------GATACTTGATTTAGTAGTGGCATTGCACCTTTT---------
457458459460461462463464465466467468469470471472473474475476477478479480
N W P Q K S E F L K R Y Y P T S V I V T A Y D I
- - - - - - - - - - - - - - - - V I V T A Y D I
------------------------------------------------GTAATTGTGACAGCTTATGATATT
481482483484485486487488489490491492493494495496497498499500501502503504
I F F W V A R M Y F M G I Y S M K N I P F K K A
I F F . V A R M Y F M G I Y S - - - - - F K . A
ATTTTCTTT---GTTGCAAGAATGTATTTTATGGGTATTTATTCT---------------TTCAAA---GCT
505506507508509510511512513514515516517518519520521522523524525526527528
L I H G L I R D E Q G R K M S K S L G N G I D P
L I H - - - - - - - - - K M S K S - - - - - - -
TTAATACAT---------------------------AAAATGTCAAAATCA---------------------
529530531532533534535536537538539540541542543544545546547548549550551552
M D L I E K Y G A D S L R W F L M T N S T P G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D I R F N Y D K I E S A W S L I N K I W N I S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y I K M L D S D K K E I I P E E I E Q N A N S W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I L E K F E N L K I L I Y E K S E T F E F S V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G K E I F K F I N E D F S S V Y I E I I K G T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S K E F I S K I W S N F L I L L H P F L P F L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
D H L Y F E L N K K E L L E S D F F E L K S R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
N N L F I D E T I E I I S T L R E Y R T R F N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S H K I D L N Y N L V S I N N S N Q C D F N L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L K K Y L I K K M A N A N F S E N G Q I F F K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N N Y E L R L Q I P E E V K K E E E T I R I K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I L F L E S E I K R S Q S I L S N E K F I N N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839
S E I K V K E E K E K L E K Y I K E F E E I K
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class I
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_val_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N C R P L E K Y D P K A F E D E I Y T K W L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N N V F L P D N S L F E K F S M V A P P P N V T
- - - - - - - - - - - - - - S M V A P P . N V T
------------------------------------------AGTATGGTTGCGCCTCCT---AATGTTACT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G V L H M G H A L N F V L Q D V L V R Y K R M K
G V L H M G H A L N F V L Q D V L V R Y - - - -
GGCGTGTTGCACATGGGGCATGCTCTTAATTTTGTTTTGCAAGATGTTCTTGTAAGGTAT------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R H N T L W L F G T D H A G I A T Q A V F E R H
- - - - L W L F G T D H A G - - - - - - - - - -
------------TTGTGGCTTTTTGGCACAGATCATGCAGGA------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K K I G K S K D D F E R E E L V Q E I F K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D R H R G I I V N Q I N K L G A S Y D H S R E R
D R H R G I I V N Q I N K L . . . . D - - R E R
GATAGGCATAGAGGGATAATTGTTAATCAGATAAACAAACTT------------GAT------AGAGAAAGG
145146147148149150151152153154155156157158159160161162163164165166167168
F T L D E N L C K A V N K V F K D L Y F K G L I
F T L D - - - - - - - - - - - - - - - - - - - -
TTTACTCTTGAT------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y R G E Y L V N L D P G S G S V V S D E E I E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K E V D G K L Y F V K Y F I D N S S F I E V A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R P E T M F G D T A I A V N P N D E R Y K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V G K E V T I P L T T K K I K V I A D F Y V D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A F G T G A L K V T P A H D P N D F E I S K R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N I S K V N I L T Q D G K L N K N V P L Q Y Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L S A K D A R F K I E T E L M E K G F L Q D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K H K Q Q V G H C Y R S G E V I E P Y L S T Q W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F V R M K P L A D K A L K A L E N G E L K F Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K K W E N T Y K Y W L S N I R D W C I S R Q L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W G H R I P V W Y N V D T S E L I V S D T D P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L D E K N M G K R F V Q D P D V L D T W F S S W
- - - - - - - - - - - - - - - - - D T W F S S W
---------------------------------------------------GATACTTGGTTTTCTTCTTGG
457458459460461462463464465466467468469470471472473474475476477478479480
L W P F S S L G W P N V D V D F K N Y Y P T N T
L W P F - - - - - - - - - - - - - - - - - - - T
CTATGGCCCTTT---------------------------------------------------------ACC
481482483484485486487488489490491492493494495496497498499500501502503504
L I T A Y D I I F F W V A R M V M A G L E F T G
L I T A Y D I I F F . V A R M V M A G L E F - -
TTGATAACAGCTTACGATATAATATTTTTT---GTTGCAAGAATGGTGATGGCAGGATTAGAATTT------
505506507508509510511512513514515516517518519520521522523524525526527528
Q V P F K D V Y I T P L L R D K Q G K K M S K S
- - - F . D V Y I T - - - - - - - - - K M S K S
---------TTC---GATGTTTATATAACA---------------------------AAAATGTCAAAGTCT
529530531532533534535536537538539540541542543544545546547548549550551552
L G N G I D P L D I I N E Y G S D S L R F T L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F L S V Q G Q D L N I D A K D F M F G A K F A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K V F N A S K F I L L N L K N R K I L N D L K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N D I D K W L L T S L N S T I L G V E S S F A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y K Y N E A S K F V Y E F F W N D F C D W Y I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I S K I D L N N E N V D I Q N M A I S K L L F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L K K S L L I L H P F I P F V T E K I Y S E F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E K E D I L A L N E Y P N F D I A N N F Q E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E I F K V L K T F I I A I R T L K S E F N I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S V E I D V A L K F D A D F K Y E A Y F K A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S I V K R M I N F K N I F Y N E N Y D G M L G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A A V G F E I Y A D V K S L I D K T K E L I R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E K Q L E K Y K M L N I S V S K K L E N E N F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
M N A P K E I V E S E K L K F V E F S S L I N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875
I N N Y I I N L K N L
- - - - - - - - - - -
---------------------------------
Class I
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_val_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L S T H Y N P I E V E Q K W Y S H W M S Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F F K A S P H S E K E P Y T I V L P P P N I T G
- - - - - - - - - - - - - T I V L P P . N I T G
---------------------------------------AAATTTTGTATTGCTTAA---TTTAGTTACAGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L H M G H V L N T T L Q D V L I R K A R M Q G
V L H M G H V L N T T L Q D V L I R K - - - - -
TGCTAAAAAACCTTGATAATATTCCAGGTCCTTTTTCAATCGTCCTAACTCCTGTTC---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K E A C W V P G I D H A S I A T E T K V V A M L
- - - C W V P G I D H A S - - - - - - - - - - -
---------AATATAAAATGCATGCCCTTGAACATGGCA---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q A K G I Q K K D L T R E A F L A H A W E W K E
- - - - - - - - - - - - - - - - - - - - - - - E
---------------------------------------------------------------------TGT
121122123124125126127128129130131132133134135136137138139140141142143144
K Y G S I I L E Q I K Q L G A S C D W D R L H F
K Y G S I I L E Q I K Q L . . . . D - - R L H F
ATTACTGTAAAGCAATAACGGTTCTTTTGGGTTTATTTG------------GAT------AATTTCTGTAAT
145146147148149150151152153154155156157158159160161162163164165166167168
T M D A G P S E A V K K V F I Q L Y E K G Y I Y
T M D - - - - - - - - - - - - - - - - - - - - -
TAAAGTAAA---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q G K R M I N W D P V G K T A L A D D E V N Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P V S S K L Y Y V R Y A I V G S D Q H I I I A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R P E T I L G D T A I C I H P H D M R Y Q H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H G K Q A I V P I A N R T I P I I T D T Y V D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D F G T G C L K V T P A H D M N D Y D L G Q R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L E V I D I L N E D G T L N V T A G H Y I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D R F V V R E K I A Q Q L Q A E G Y L E K I E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y T S N I G L S E R T H A V V E P R L S K Q W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V R I Q E L A K P A F E H V L D N T I Q F H P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K F K H M Y Q A W L N N V R D W C I S R Q L W W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G H Q I P A F Y L P D G T V I V A E D K A A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A K A H M N P V Y K N L T E A D I R Q D E D V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D T W F S S W L W P I S V F D G F G N P E N Q D
D T W F S S W L W P I - - - - - - - - - - - - -
AACCGTACCATCTGGCAAGTAAAATGCAGGGAT---------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I Q Y F Y P T Q V L V T A P E I I F F W V A R M
- - - - - - - - V L V T A P E I I F F . V A R M
------------------------ATACATATGTTTAAACTTGGCCGGGTGAAACTG---GGTATTATCCAG
505506507508509510511512513514515516517518519520521522523524525526527528
I M A G Y A F T N R L P F K H V Y F T G I V R D
I M A G Y A F - - - - - F . H V Y F T - - - - -
CACATGTTCAAAAGCGGGTTT---------------TCG---GAACCATTGCTTAGA---------------
529530531532533534535536537538539540541542543544545546547548549550551552
K L G K K M S K S L G N S P E P I D L I K Q Y G
- - - - K M S K S - - - - - - - - - - - - - - -
------------ACGTTCAGAAAGGCC---------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A D G V R V G M L F S S P A G N D L L F D I K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
C E Q G R N F A N K I W N A F R L I K G W E V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A K S S Q P D D T M A I N W F E A R F N Q V L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T I E E H F E Q F R I S D A L M S I Y K L I W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D F C A W Y L E M V K P A Y G E P I S P T T Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A T V E F L A K L L K I L H P F M P F I T E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
W H Q L Q P R S A Q D C I T V A P W P Q S I T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D N Q L L E E A A L S F T L I T E I R N I R V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A Q I N P K E P L L L Y S N T M L P A W F S R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S N Y I Q K L G Y I N Q I A V S E G P I Q D S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S C H V Q G H A F Y I P F Q Q K I D V E Q E L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R L K K D L E Y Y Q G F L A A V T K K L S N T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
F V E Q A P P A V V E I E R R K Q S D A I A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877
K V M E S R L L E I S G E
- - - - - - - - - - - - -
---------------------------------------
Class I
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_val_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T D P H T T T L P T Q F D P T G I E P K W A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R W R S E P F R A D A T S G K D P F T I V I P P
- - - - - - - - - - - - - - - - - - T I V I P P
------------------------------------------------------GCCCTGCGCCTGCTTGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P N V T G N L H L G H A L D N T L I D T L I R Y
. N V T G N L H L G H A L D N T L I D T L I R Y
---CTTGTCGAGTTCGGCGAGGCGTTTTTGCTGCTTTTTCACCCAGTCGGCGATGTCCACCGTGCCTTCCAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K R M A G F E A L Y L P G M D H A G I S T Q V V
- - - - - - - - L Y L P G M D H A G - - - - - -
------------------------GGCCACCTGCGAGAGCGTGCGGCCTTCCAG------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E R Q L K D A G T S R H D L G R E A F L E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
W E W K G K S G G M I L D Q L T R L G V S A D W
- - - - G K S G G M I L D Q L T R L . . . . D -
------------CGGCGAGAGGCCCAGTTCGCTCTTGAGGCTGCGAGCACTGTC------------CAG---
145146147148149150151152153154155156157158159160161162163164165166167168
T R E R F T M D E G L S R A V R T Q F V K L Y H
- R E R F T M D - - - - - - - - - - - - - - - -
---GAAAGCTTTGGTGGCTTCCGC------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D G L A Y R G E R I V N W D P A S Q T T L S E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E I D R E V R K G K M Y T L S Y K L E N S A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G S N G E T G E I R I A T V R P E T I F A D Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I A V H P E D E R F R H L V G Q K A R I P L T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R W V P I I A D E A V E M E F G V G A L K I T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A H D P T D F E V G E R H G L E R P S V I D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G N L T R D E L V P A E F Q G L E R F A A R K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V V K A L E E S G D L L E Q K D H D T A I G L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E R T K V P V E P I I S E Q W F V K M K P F A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q V L E G L D K G E I K L V P E R Y T K V N R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W L E N I R D W N I S R Q L W W G H Q I P A W Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D K E G N I Y V P D P E N P E L D C D Q D P R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A H L N L R R D P D V F D T W F S S N L W P F S
- - - - - - - - - - - - D T W F S S N L W P F -
------------------------------------GGGGTTTTCCGGGTCGGGCACGTAGATGTTGCC---
481482483484485486487488489490491492493494495496497498499500501502503504
T L G W P D T D S E D F R K F Y P T Q V L V T G
- - - - - - - - - - - - - - - - - - - V L V T G
---------------------------------------------------------ATCGCGGATGTTTTC
505506507508509510511512513514515516517518519520521522523524525526527528
Y D I L F F W V A R M Q M A G Y G L T G Q A P F
Y D I L F F . V A R M Q M A G Y G L - - - - - F
CAGCCAGTCACGGTTGAC---CGTGTAGCGCTCGGGCACCAGCTTGATCTCGCC---------------CAA
529530531532533534535536537538539540541542543544545546547548549550551552
S T V M L H G L Y L D A K G Q K M S K S K G N G
. T V M L H - - - - - - - - - K M S K S - - - -
---CTGGTCGGCAAAGGG---------------------------AATGATGGGCTCCAC------------
553554555556557558559560561562563564565566567568569570571572573574575576
I D P L E L F G Q Y G V D A C R F A F T F L S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G G Q D I K H D A R R F E Q G R N F A N K L W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A T R F A L M R L G E A R I E G S D D L S A Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
R A A V T L P D G V L L R S K D V L A Q L K E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
D D L T L A D R W I I S R L N D V T A E A S A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L D A F D I G A A I R T L Y S F T W D E F C D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y I E A A K P E L A S G N L G T M A T L K V V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E H V L K L L H P F M P F I T S E L Y A A L G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R R Q I A V H S W P Q P D A A L H D A E A T K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F D A L R S A V D S A R S L K S E L G L S P Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R L N V A V D G D L A D V V R Q N A R V V E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A R V N L V P A L E G R T L S Q V A P G V T I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A P L E G T V D I A D W V K K Q Q K R L A E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K Q I K Q A Q G K L N N E G F V A R A P A E V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
E E E K R R V A D F G A Q K E R L E G V L A Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913
G
-
---
Class I
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_val_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E M K P K Y D P R E V E A G R Y E E W V K N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y F K P S E D K S K E T Y T I V I P P P N V T G
- - - - - - - - - - - - - T I V I P P . N V T G
---------------------------------------GTTTTCATTAGAGAGCTT---ATCTACTCTATC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K L H L G H A W D T T L Q D I I T R M K R M Q G
K L H L G H A W D T T L Q D I I T R M - - - - -
TAATTCGCTTTGAAGTTTAGCTAATTCTTTTTCCAAACGGCTGATTTCCTTATCCAT---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y D T L Y L P G M D H A G I A T Q A K V E A K L
- - - L Y L P G M D H A G - - - - - - - - - - -
---------TACCACTTTACCTGCAATTACAACTGATGT---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N E Q G I T R Y D L G R E K F L E Q A W D W K E
- - - - - - - - - - - - - - - - - - - - - - - E
---------------------------------------------------------------------TTC
121122123124125126127128129130131132133134135136137138139140141142143144
E Y A S F I R A Q W A K L G L G L D Y S R E R F
E Y A S F I R A Q W A K L . . . . D - - R E R F
TTTATCTTTAGCTTGAATTAAAATAGGTATTTCTTTAGA------------TAC------ACGTGATTGTCT
145146147148149150151152153154155156157158159160161162163164165166167168
T L D E G L S K A V K K V F V D L Y N K G I I Y
T L D - - - - - - - - - - - - - - - - - - - - -
TACAGATTT---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R G E R I I N W D P K A R T A L S D I E V I H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D V Q G A F Y H F K Y P Y A D V E G F I E I A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R P E T M L G D T A I V V N P N D E R Y K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I G K T V I L P I V G R E L P I L A D E Y V D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D F G S G A M K V T P A H D P N D F E I G Q R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q L E N I I V M D E N G K M N N K A G K Y E G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D R F D C R K Q L V E D L K E Q D L V I K I E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H V H S V G H S E R S G A V V E P Y L S T Q W F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V R M E D L A K R S L D N Q K T D D R I D F Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q R F E H T F N Q W M E N I R D W T I S R Q L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W G H Q I P A W Y H K E T G E I Y V G E E A P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D I E N W Q Q D E D V L D T W F S S A L W P F S
- - - - - - - - - - - - D T W F S S A L W P F -
------------------------------------ATCAGTTGGCGCTTCTTCTCCAACATATATTTC---
457458459460461462463464465466467468469470471472473474475476477478479480
T L G W P D L E S E D F K R Y Y P T N A L V T G
- - - - - - - - - - - - - - - - - - - A L V T G
---------------------------------------------------------CGTCCAATCTCTAAT
481482483484485486487488489490491492493494495496497498499500501502503504
Y D I I F F W V A R M I F Q G L E F T D R R P F
Y D I I F F . V A R M I F Q G L E F - - - - - F
ATTTTCCATCCATTGGTT---TGTATGTTCGAAACGTTGCGGATAAAAATCAAT---------------TTG
505506507508509510511512513514515516517518519520521522523524525526527528
N D V L L H G L V R A E D G R K M S K S L G N G
. D V L L H - - - - - - - - - K M S K S - - - -
---ATCTAATGAACGTTT---------------------------TTGCGTTGATAAATA------------
529530531532533534535536537538539540541542543544545546547548549550551552
V D P M D V I D E Y G A D S L R Y F L A T G S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P G H D L R Y S T E K V E S V W N F I N K I W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G A R F S L M N I G E D F K V E D I D L S G N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S L A D K W I L T R L N E T I A T V T D L S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y E F G E V G R A L Y N F I W D D F C D W Y I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
M S K I P M N G N D E E Q K Q V T R S V L S Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L D N I M R M L H P F M P F V T E K I W Q S L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H E G E T I V K A S W P E V R E S L I F E E S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q T M Q Q L V E I I K S V R Q S R V E V N T P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S K E I P I L I Q A K D K E I E T T L S Q N K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Y L I K F C N P S T L N I S T D V E I P E K A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
T S V V I A G K V V L P L E G L I D M D K E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R L E K E L A K L Q S E L D R V D K K L S N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
F V S K A P E K V I N E E K R K K Q D Y Q E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876
D G V K A R I E Q L K A
- - - - - - - - - - - -
------------------------------------
Class I
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_val_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A T Y D P A A V E A D W Y P W W E K S G F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R P A S D H K S E T A T K P F V I I A P P P N V
- - - - - - - - - - - - - - - V I I A P P . N V
---------------------------------------------ATTAGGGATAGACATCTT---CTTCAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T G Y L H L G H A L T G A V Q D T L I R F H R M
T G Y L H L G H A L T G A V Q D T L I R F - - -
TCCCTCAATCTGCTTCATGAGGCCGTCCAGCTGCTTCTCCAGCTTCGCCACCTCCTTCCCGAC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K G D N T L Y L P G T D H A G I A T Q V V V E R
- - - - - L Y L P G T D H A G - - - - - - - - -
---------------GTTCACGCCCACCTCCTTTGTCACCACGGA---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R V M K E E G K S R H D L G R D E F M K R L W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F K K N H A G M I T E Q F R R I G L S L D W T R
- - K N H A G M I T E Q F R R I . . . . D - - R
------CAGCTCCTGCAGCTCCGCCGTATGCGCCGTCACCCACACGTC------------GTT------CGA
145146147148149150151152153154155156157158159160161162163164165166167168
E R F T M D E Q S S A A V V E A F V R L H E D G
E R F T M D - - - - - - - - - - - - - - - - - -
GTACGAGGCCTTGGTGGA------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L V H R D T R L V N W C C A L Q S A I S D L E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E F V E V P K T S K M T I P L Y D R K V D M G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L T H V A Y K L A D S D D E L V I A T T R P E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L L G D T A V A I H P D D E R Y K K F H G K F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K C P F R D D I I P I V L D A T L V D M N F G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G A V K I T P A H D P N D F E S G K R H N L Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L V M M N L K G Y V T M E P F K G M H R F D C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R E I V K K L E E M G L L R G V E P Y E Y R V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R C E R T G D I V E P M L M P Q W F I D C S D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A R R S V E A V R N G D L R L Y P P S H E A V W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y H W L E N I K P W C V S R Q L W W G H R I P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y K V V G S L P K D V D P W V V A R N L Q E A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A K A K K K F G L T D E Q V A E A S F E Q D P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V L D T W F S S G L W P F A T L G W P T D S D D
- - D T W F S S G L W P F - - - - - - - - - - -
------GAACCAGGTGTCCAGCACATCCGGGTCCTGCTC---------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
M K R F F P N S L M E T G H D I L F F W V A R M
- - - - - - - - L M E T G H D I L F F . V A R M
------------------------GTGCGCCTCCTGCAGATTGCGGGCGACCACCCA---GTCCACGTCTTT
529530531532533534535536537538539540541542543544545546547548549550551552
V M L S L H F T N K L P Y K E V F L H A M V R D
V M L S L H F - - - - - Y . E V F L H - - - - -
CGGCAGCGAGCCGACAACTTT---------------GTG---CCACCAGAGCTGACG---------------
553554555556557558559560561562563564565566567568569570571572573574575576
K N G E K M S K S K G N V I D P L Y V I H G V S
- - - - K M S K S - - - - - - - - - - - - - - -
------------CAGCCAGTGGTACCA---------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L Q T L H N T V R S G N L G D K E V E K A I K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q K E F F P E G I P E C G S D A L R F G L L S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T Q S G R S V N L D I Q R V V A Y R Q F C N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
W N V V R Y V L Y H A L G T D Y V P S K Q Q F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
P A E D A A M L P L E C R W I L S R L D A A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E A T Q G M S E G L Y D F A L A T G A V Y R F W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L H E L C D V F L E L T K P T I Q K G G E K Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L V Q D V L L H V V E K A L R L L H P M M P F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
T E E L W H R L P N Y S S F G S E S I M L A K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
P T P S G W L S A A S D S A M S I I L D V V H S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V R S T K A S Y S L T N K H K P D V W V T A H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A E L Q E L F A A E K M M I S T L G V V G E V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V V S P A E E T A A V P K G C G F S V V T K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
G V N M M L M G F I D V G K E V A K L E K Q L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G L M K Q I E G M K K K M S I P N Y E T K V P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E I R V T N T E K L K T L E A Q S A Q L R D G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967
E K M S S L K
- - - - - - -
---------------------
Class I
Eukaryotes/Naegleria gruberi/amino acid sequences/Ngruberi_val_aa
Eukaryotes/Naegleria gruberi/nucleotide sequences/Ngruberi_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K R I T I K Q A T P N N Q N K K F G L M K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L G I S S V H Q Q Q Y R N F H Y N N I Q D E T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S S E E S S T T K L N R I L T S S F D P S R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q D W Y S W W E E K G L F K G E D S T T K P Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I L L P P P N V T G S L H I G H A L T A S I Q
T I L L P P . N V T G S L H I G H A L T A S I Q
ACAATTTTACTTCCACCT---AATGTGACAGGAAGTCTTCACATTGGACATGCTCTCACTGCCTCTATTCAA
121122123124125126127128129130131132133134135136137138139140141142143144
D S L C R Y K K M N G Y N V L W V P G V D H A G
D S L C R Y - - - - - - - - L W V P G V D H A G
GACTCACTTTGTAGATAT------------------------TTGTGGGTTCCTGGTGTTGACCATGCTGGT
145146147148149150151152153154155156157158159160161162163164165166167168
I S T Q V A V E K K I A K E E G K T R H D L G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E F L K R V W S W K E E Y G N R I D N Q M K A
- - - - - - - - - - - E E Y G N R I D N Q M K A
---------------------------------GAAGAGTATGGCAATAGAATTGATAATCAAATGAAGGCT
193194195196197198199200201202203204205206207208209210211212213214215216
M G S M T D W S R K V F T M D A Q F S S A V L E
M . . . . D - - R K V F T M D - - - - - - - - -
ATG------------GAT------AGAAAAGTCTTTACTATGGAT---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
C F V R L A R D G L I Y R D A K L V N W C P Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N T A I S D I E V E Y I S L K K K T K V M V P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
C E E K S F D F G V M H T F K Y P V I S S P G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T E I I G Y I N V S T T R L E T M L G D T A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I H P E D E R Y K N F H N K F I L H P F D S K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A V P I I C D E K L V N M E I G T G A V K I T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A H S F E D F E C G K R H G L E F I T I L N K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G S L N D Q V P V E F S G K N R F I V R K L L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D K L K D M E L F I S E Q D H E M E L P I C S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S K D I L E P M L L N Q W F V K C D S L A K K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L D L V N N N E I L I H P S Y H K T T W N N W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E N I H D W C I S R Q L W W G H R I P A F K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G D L S K L E P L M E E L R K E K S F I M E Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N K N S S N I E N I W I V A H K E E E A I S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q K N V P N F S N F V L E Q D E D V L D T W F S
- - - - - - - - - - - - - - - - - - - D T W F S
---------------------------------------------------------GATACTTGGTTCTCA
577578579580581582583584585586587588589590591592593594595596597598599600
S G L Y P L A A F G W P S R S E N V L K D L D Y
S G L Y P L - - - - - - - - - - - - - - - - - -
TCTGGACTTTATCCATTG------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R Y P S S V M E T G S D I L F F W V A R M V M L
- - - - - V M E T G S D I L F F . V A R M V M L
---------------GTCATGGAAACAGGAAGTGACATTCTCTTCTTT---GTTGCAAGAATGGTCATGCTT
625626627628629630631632633634635636637638639640641642643644645646647648
C T Y L S D N K E K P F N E I Y L H S M V R D K
C T Y L - - - - - - - F . E I Y L H - - - - - -
TGCACTTACTTG---------------------TTC---GAAATTTACCTCCAC------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Q G R K M S K S L G N V I D P I D M I K G T T F
- - - K M S K S - - - - - - - - - - - - - - - -
---------AAGATGTCTAAAAGT------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E D L K R G I E K N T N I T K Q E M K K A L Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V Q Q E F P N G I P Q C G T D A L R F T L I Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T Q Q G R Q I N L D V M R A Q S N R H L C N K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
W Q S A R F C L S H F E R F N Y S V P G N D E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L S E L L L K S F A S L E K S Q Q V L Q N Q W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L L N L S E T I D V T R N S I D N F M F S D G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
T S I Y Q F F I Y Q F C D N Y L E I V K P I L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S S N T M T P L I E N T L H T L N Y C L V T V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K L L H P Y M P F I T E E L Y H C C P L N G E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
N A L Y A K L S N K N S S Y I P T S S I L E C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
Y P T S F T A D E I G S I L E I G S S K Q L I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E K M D K I L Q I V Q Q L R S M K Q N L Q L P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
K S E L T A Y I F Y Q G S S T T A F N L S E N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
I K I I Q T L T K F T S I K F I T E E E S K K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
K H T L Y L T A T A F S T P Q G T V M T Q L V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
P D E F Q L E K E I E K W Q K K I E Q L A S V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
A K Y L K Q V H P N L P P E V K Q Q I E D K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
Q N Q I E T Q K A Q E T C S Q L E H L L D N K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
Q
-
---
Class I
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_val_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L K M D R K A L K E E K K K Q K L E K F L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K K T T Q S K I S K A P K P A K N K S S S G Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P M P V E Q K W N N Y W L S N N L F E P Q E R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N K F V M C M P P P N I T G S L H I G H S M M I
- - - V M C M P P . N I T G S L H I G H S M M I
---------ATAACTTGTATACATCAA---ATTATCGAAAAACTGGGAATAAATCTCTTCTGTAATGAAGGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I Q D A I C R Y M R L I N Y E V L Y L P G T D
A I Q D A I C R Y - - - - - - - - L Y L P G T D
CATATACGGACTGAATATTTTTATAGA------------------------TTGGATATATTTTTTAGTTTT
121122123124125126127128129130131132133134135136137138139140141142143144
H A G I A T Q T V V M K Q L E K E K K T Y N R E
H A G - - - - - - - - - - - - - - - - - - - - -
GATTTTTTT---------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S F L E A T W K W K E N Y G S R I L D Q F K R L
- - - - - - - - - - E N Y G S R I L D Q F K R L
------------------------------ATGTGTGGTAGAAATCACTTTATTTCTTTCTTGTATCAGCCA
169170171172173174175176177178179180181182183184185186187188189190191192
G T S A D F S R Q K F T M D A G M N K A V T E A
. . . . D - - R Q K F T M D - - - - - - - - - -
------------ATC------ATTAGACAAATCTAGATTAAG------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F C S L Y E K G L I Y R D N K I V N W C C K L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T T L S D I E I D Y L S V G K N T I L K I D G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D Y E F G V I Y V F K Y P V K F V K D G Y E S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G H I E V A T T R P E T I L G D V A L C A N P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D A R Y T K Y D K I I P R N P I T E E E L S F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F D E A A E M D L E S G V L K I T P A H D P I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F E I G K K N N L K N I K I F D N Q N K I I I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G N Y Y K L K R L D A R D L V V Q T L K N K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F V E K K P Y E Q V L P M C S R S S D L L E P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I K E Q W W C S C S E M A K K A I D A V K T E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I K I Y P E E S K D D W Y R W F E N P R D W C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S R Q L W W G H R I P A Y K T P D G V W T I A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N K E Q A I R S Y K K N N P L N A H Y Q E S D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V Q D E D V L D T W F S S G L W P F A T L G W P
- - - - - - - D T W F S S G L W P F - - - - - -
---------------------ATCTCTAGCATCAAGTCTTTTTAATTTGTAATA------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N K N Q D L D K Y F P T S L L E T G K D I L F F
- - - - - - - - - - - - - L L E T G K D I L F F
---------------------------------------ATTCTTTTTTCCTATTTCAAAATCAATTGGGTC
553554555556557558559560561562563564565566567568569570571572573574575576
W V G R M V M M S L E L T G K V P F K K V L L H
. V G R M V M M S L E L - - - - - F K . V L L H
---TGCGGGGGTAATTTTTAAAACACCAGATTCAAG---------------TTCATC---AACAAAAGAAAG
577578579580581582583584585586587588589590591592593594595596597598599600
G I V R D A Y G R K M S K S L G N V I D P I H V
- - - - - - - - - K M S K S - - - - - - - - - -
---------------------------TATTATTTTATCATA------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I D G A S I E T L L D A L K L G N L T K E N L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N A E S A V K K D F I N G I T V C G A D A L R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T L L S Y M N G I N D I K L D I E R V K G N R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F C N K I W N A A L F V K K I V D E I I S S D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L S Y Q D L L N L D L S N E D D K L L V W L I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E R N K V I S T T H K A F K E Y K F M S A V Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I H Q F F L Y D F C D V Y I E I V K K I K T K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Y I Q A C F M M L I D S I K I F S P Y M P F I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E E I Y S Q F F D N S L M Y T S Y P E I I H N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
F S T N F K S T L S K I K A I R A D I E K Y G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E K V D V I L D G C E C F D K I D I Q F I S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883
I P N I N T I K F G E G Y E V K K V N
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class I
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_val_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E G Q G K S K A K A A K A A K G G S G K A I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q K A E G K A L R T E L K A F E Y E Y E T P V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K K N I S G A W P K A Y N P S V I E K S W Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W W E A A G F F S P D M Q K N I R S K D S R C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F T L L I P P P N V T G S L H I G H A L T N S I
- T L L I P P . N V T G S L H I G H A L T N S I
---ACCCTGCTGATCCCTCCA---AATGTCACTGGGTCCCTACATATTGGCCACGCTCTCACTAATTCCATT
121122123124125126127128129130131132133134135136137138139140141142143144
Q D A L V R W Y R M M G Y R T L Y L P G L D H A
Q D A L V R W - - - - - - - - L Y L P G L D H A
CAAGACGCGCTTGTGCGGTGG------------------------TTGTACCTCCCCGGGCTTGATCACGCT
145146147148149150151152153154155156157158159160161162163164165166167168
G I A T Q S V V E R N I M K T E G K T R H D L G
G - - - - - - - - - - - - - - - - - - - - - - -
GGG---------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R E R F L E R A W A W K E Q F G G R I L S Q L R
- - - - - - - - - - - - E Q F G G R I L S Q L R
------------------------------------GAGCAGTTCGGTGGGCGAATTCTGTCTCAGCTGCGA
193194195196197198199200201202203204205206207208209210211212213214215216
I L G S S F D W S R S V F T L D P A R S R V H N
I L . . . . D - - R S V F T L D - - - - - - - -
ATTTTA------------GAT------CGGTCTGTCTTCACGCTGGAC------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E S F V K L F N R G L I Y R D S R L V N W D C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L Q T A V S D V E V E Y I D L K L P R Q L S V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N H D P G K S Y P F G Y L W R F S Y K V I P S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L A D K S E A D L L T A F Q S G E L K F A C Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
C A K F Y T S S I L P L L D S D S I A E G S P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P Y E L L R L H Q C A D P G C L F T A E E L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A T T R P E T I I G D T A V A V H P R D H R Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L H G R C L F H P I L L G K K V P I V L D D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L V D M E Y G T G C V K V T P A H D P N D F E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G R R N K L E Y L Q I F T D D G R I V Q M I E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T H N G I T Y H L P A R F A G V K R F D G R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M L S Y L K E A A L Y R G R T P N P M V I G T C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q R S G D I L E P M V K P Q W Y L N C E Q M A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R A L N A V Y A P P S E A E R L L I V P E M H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D T W K S Y L A N I R P W C I S R Q L W W G H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I P C Y K F W F G D N P E P S G D K T E H W V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A C S E E E A R R I I T K K H L D V Q G Q L H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K Q D D D V T D T W F S S G L F P F S C F A D S
- - - - - - - D T W F S S G L F P F - - - - - -
---------------------GACACGTGGTTTTCATCGGGGCTCTTCCCCTTC------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E R D F S R Y Y P G S V L E T G N D I I F F W V
- - - - - - - - - - - V L E T G N D I I F F . V
---------------------------------GTTCTGGAGACAGGTAACGATATCATCTTCTTC---GTG
673674675676677678679680681682683684685686687688689690691692693694695696
A R M V M L S L E L Y N V L P F R E V Y L H A L
A R M V M L S L E L - - - - - F . E V Y L H - -
GCTCGGATGGTCATGCTCAGTCTCGAACTC---------------TTC---GAGGTGTACCTCCAT------
697698699700701702703704705706707708709710711712713714715716717718719720
V R D A H G A K M S K S K G N V V D P I D V I K
- - - - - - - K M S K S - - - - - - - - - - - -
---------------------AAAATGTCGAAGTCT------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G I T L Q E M G D K V R A T N L P P K E I E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L E L Q S K D F P I G I P E C G T D A L R F A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
C A Y T G Q G R S I N L D V N K I V A Y R N F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
N K I F N A V K F G C Y F S G I C D V L D V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G A T N A C G R F W Q S N I R H Y E D F N D F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
M R V Y R T T L S A R T F K T T A A T V G E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P T A A Y T T N D P N D I Y T P C T Q S E D H Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
S I V A A R W I L S R L Y N T V R T V T K S F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E F R I A D A C T A I Y T F W Y D D L C D V F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
E L V K P I I A S M S A E P K R L D A H A E I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
R M V Y F C C I D Q G L R L L H P F M P F L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
E L F Q H L P R W S K E E G L E T L M Y A E Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
T S Y G A H H F V T F G S K H E L L G E E L S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
D E Q K K V E G T S I Y R L S S V L R D R A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
210431044104510461047104810491050105110521053105410551056105710581059106
E M V A H L K P L M T A A R A L R G Q Y N I K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
010611062106310641065106610671068106910701071107210731074107510761077107
S S T P R Y Y I A C D K S D E H Y K H I M D G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
810791080108110821083108410851086108710881089109010911092109310941095109
Y V I K T L C N M R Q L D I V S P K V K F S N C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610971098109911001101110211031104110511061107110811091110111111121113111
G C T V L S A T L L I Y M D L R G L I D V E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
411151116111711181119112011211122112311241125112611271128112911301131113
L S K V S K E M E Q I R T Q I E K L D K L M K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
211331134113511361137113811391140114111421143114411451146114711481149115
S N Y D R M P E H L R K Q N D E K M A G F L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
011511152115311541155115611571158115911601161116211631164116511661167116
L L Q L E E L A A S Y Q A M K E V E
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class I
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_val_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D A A R A T P K G Q K K D Y A A E M P K G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D P K F V E A A T Y A W W E D C G Y F K P N D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D A E P F V I V I P P P N V T G S L H L G H A
- - - - - - V I V I P P . N V T G S L H L G H A
------------------GTGATCGTTATCCCACCC---AATGTGACGGGCTCGTTGCACCTTGGCCATGCT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L M V A V E D T L T R W H R M S G R N A L W V P
L M V A V E D T L T R W - - - - - - - - L W V P
CTCATGGTCGCCGTAGAGGATACACTGACGCGGTGG------------------------CTGTGGGTACCT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G T D H A G I A T Q T V V E K Q L Q R E Q G I T
G T D H A G - - - - - - - - - - - - - - - - - -
GGAACAGACCATGCAGGC------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R H D L G R E A F V G E V Y K W V D T Y G G K I
- - - - - - - - - - - - - - - - - D T Y G G K I
---------------------------------------------------GACACTTACGGAGGCAAGATC
145146147148149150151152153154155156157158159160161162163164165166167168
L A Q L R R M G A S P D W S R L A F T M D D K L
L A Q L R R M . . . . D - - R L A F T M D - - -
CTGGCGCAGCTGCGGCGTATG------------GAC------CGCCTGGCATTCACCATGGAC---------
169170171172173174175176177178179180181182183184185186187188189190191192
S A A V L E A F L R L H K E G L I Y R D N R L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N W C T R L K T A V S D I E V D Y I D I A E N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E L A V P G Y D E K V M F G V L T S F A Y P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D G A G E I V V A T T R P E T M L G D T A V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H P D D P R Y A H L H G K H V V H P L D G R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I I T D A E L V D I S F G T G A V K I T P A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D P N D F A T G K R H A L D F I N I L T N D G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I N E R G G Q F A G Q P R F Q A R K T V V D W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K E K G L Y R G E A G N A M R L G L C S R S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V I E P V L K P Q W W V S C K G M A D D A C A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V R D G R I S I L P D E F K A T W F R W L E N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R D W C I S R Q L W F G H R I P A Y Y V T L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E G D A A P P G T M D E R M D R W V V A R D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S A R K V A E E R F P G K V Q N L V Q D D D V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D T W F S S G L F P F S V F G W P E Q T P D L A
D T W F S S G L F P F - - - - - - - - - - - - -
GACACCTGGTTTTCCTCGGGCCTGTTCCCCTTC---------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K Y Y P T T L L E T G H D I L F F W V A R M V M
- - - - - - L L E T G H D I L F F . V A R M V M
------------------CTGCTGGAGACGGGGCACGACATCCTCTTCTTC---GTCGCCCGCATGGTCATG
553554555556557558559560561562563564565566567568569570571572573574575576
M G M K L T G E V P F K Q I Y L H S M V R D A H
M G M K L - - - - - F . Q I Y L H - - - - - - -
ATGGGCATGAAACTC---------------TTC---CAGATCTACCTGCAC---------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G R K M S K S L G N V I D P L H V I E G I S L E
- - K M S K S - - - - - - - - - - - - - - - - -
------AAGATGTCCAAGTCC---------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G L Y S T L G G G N L E K N E M E R A K Q G Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A D F P E G I E E C G T D A L R F T L L S Y T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Q A L S V N L D I K R V V A N R Y W C N K L W N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A V K F A L E R L G D D F R P S P Q L P A A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L P L P C R W I L S R L N A A T Q K V V T G F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T Y S F A D G T Q A L Y G W W Q Y D L C D V F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E L V K P V I P R P G A E A E A A G A E T A A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A A F T S S P E G Q Q A Y K D T L W L C L D T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L R L L H P F M P F V T E E L W Q R L P G R R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
Q S G G F A S I M I A P F P A A Q P S W A D P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G E D E V A L I L D V V R A A R S L R S D Y D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K T K Q R Q A L H I A C K V A S S A D V L R R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
S E L I G T L A L S D T V K V L Q E G E E A P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G C G V Y V V N D A M T V C L D L E G I V D P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
K E A E K L Q A K Q A K L A E Q I E V L N T K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
S M S D Y E E K T P E D I R R A D A E K L K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005
A D E E A M L Q Q H L K S M L E R A Q Q R
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class I
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_val_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K A V S S F N N A S E M L A K V Y E P V E T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A R W Q K A W E E S R I F H P D P N A P G E P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S V V I P P P N V T G S L H M G H A F N S A L I
S V V I P P . N V T G S L H M G H A F N S A L I
TAGAATTTCTTTATTAGC---TGATAAATCTCTCTCCAAACGAATTCTAAGAGCTTCTAGATCGACTAATCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D T I V R F Q R L L G K N T L C L P G T D H A S
D T I V R F - - - - - - - - L C L P G T D H A S
ATCAATAGGAAGCAATAC------------------------TAAACATGAAGGTAATTCTGGACTTTCCCA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I A V Q T I L E R Q L K E Q G K S K E D L G R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G F L D L A W R W K V Q S G G I I V N Q M R R L
- - - - - - - - - - V Q S G G I I V N Q M R R L
------------------------------TGCAAACTGATTCGGCTTAAGTCCGGCTACTGTACGAAGGTT
145146147148149150151152153154155156157158159160161162163164165166167168
G Y S A D W Q R E R F T L D K G L N D A V I E A
. . . . D - - R E R F T L D - - - - - - - - - -
------------AAT------AATAAATTCTAAGAATTGTTG------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F V L L H E Q G L I Y R G E Y L V N W C P A S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S A V S D L E V E T R D V K G S L W Y F R Y P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K N S S A Y L E I A T T R P E T L L G D V A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V N P D D K R Y K S L V G Q K L I L P L V G R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I F I I A D D H V D A N F G T G C V K V T P A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D P N D F A I G M R H N L S Q V T V I D K N G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M N D M A G I F A G L D R F Q A R K A V V A A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E A K G L L V K I E T Y Q H S I P Y S D R G K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P I E P L L S F Q W F V N A E P L A L N C R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L D T D H L K F V P K R W E K V Y R N W L I D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R D W C I S R Q L W W G H Q I P V W F V I S E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N S Q L N E H T P Y I V A R T S V E A L E Q A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E C Y G D K I V I N Q D E D V L D T W F S S G L
- - - - - - - - - - - - - - - - D T W F S S G L
------------------------------------------------AGCCACTATATAAGGCGTATGCTC
481482483484485486487488489490491492493494495496497498499500501502503504
W P F S T L G W P D S N S A D F Q C W Y P N S T
W P F - - - - - - - - - - - - - - - - - - - - T
GTTAAGTTG------------------------------------------------------------ACT
505506507508509510511512513514515516517518519520521522523524525526527528
L V T G F D I I F F W V A R M T M M A S S F T K
L V T G F D I I F F . V A R M T M M A S S F - -
AATACACCAATCTCTAATGTCTATTAGCCA---GCGATATACTTTTTCCCAGCGTTTTGGTACAAA------
529530531532533534535536537538539540541542543544545546547548549550551552
K M P F K E V Y I H G L V R D E N N C K M S K S
- - - F . E V Y I H - - - - - - - - - K M S K S
---------ATC---TGCTTCACGACAATT---------------------------CCATTGAAAAGATAA
553554555556557558559560561562563564565566567568569570571572573574575576
M G N G I D P L V L I D R Y G A D A L R F A L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
W E V A G A G Q D I R L D Y N R N E N T S L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E S S R N F A N K I W N A C R F T L M N L N D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N T N N L G T P D P R Q L K L S D R W I L S R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A Q V N I E M S E Y Y S S Y N L G E A A K A I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E F T W N D L C D W F I E L A K R R I N S D D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T L R Q T T F Q V L M I V L E Q I L V M L H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
M P H I T E E L W H G L M R V P A N V F L A N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
P W P M I D R G A I D N L L E Q Q F L E F I E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I R I V R N L R T V A G L K P N Q F A P V L F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
T K R S D L A A V L K E S I Q D I M S L T R A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L V E I L W E S P E L P S C L S G M S G E L Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L L P I D G L V D L E A L R I R L E R D L S K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
N K E I L I L I N R L D N P N F I N K A P E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V S E A K T N L E Q L K I Q S A V A Q G R L D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916
I L G F
- - - -
------------
Class I
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_val_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_val_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A T D K F K L F A D F L K D K P S L K H E M P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S Y N P S E V E S H W D A I W C E S K I Y L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N F E R A S N L P F E N K F V I A L P P P N V T
- - - - - - - - - - - - - - V I A L P P . N V T
------------------------------------------GTTATTGCCCTTCCTCCC---AATGTTACG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R L H L G H T L T A A I Q D S L C R Y N R L I
G R L H L G H T L T A A I Q D S L C R Y - - - -
GGAAGGCTTCATTTGGGTCATACACTTACTGCAGCAATTCAAGATAGTTTATGCCGTTAT------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G K E V L W I P G T D H A G I A T Q T V V E R I
- - - - L W I P G T D H A G - - - - - - - - - -
------------CTTTGGATTCCAGGCACAGATCATGCCGGC------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I H Q T D N V T R H D L G R D N F L K K V W E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K E K H G S A I C S Q F R R L G C S L D W S R E
- E K H G S A I C S Q F R R L . . . . D - - R E
---GAAAAACATGGATCTGCTATCTGTTCTCAATTTCGTAGACTT------------GAT------AGAGAA
169170171172173174175176177178179180181182183184185186187188189190191192
F F T L D E N M S K A V N N A F I Q L F N Q G Y
F F T L D - - - - - - - - - - - - - - - - - - -
TTTTTTACCTTGGAT---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I F R K T R L V S W C S Y L R T A L S D I E V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L L E V N K P S R I R I P G Y E K T V E V G V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
W H F S Y P L E Q H G Q T H E W H F M P E N I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N I E K I T V A T T R I E T M L G D V A I A V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P K D N R Y K S L I G K Y C L H P F I K D R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I I I A D E H V D P E F G T G C V K I T P A H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K N D F E I A S R Y N E K H K S E P L F E K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I S V F T N D G N I G P G F G I F S G I H R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K C R E L V E K E L E K I K L L V E K T P N S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A M Q I P I C S R S N D I V E L F L I P Q W W M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N C K P F A E K A C K A V K N H E L Q I E P K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
H E Q T W F Y W L E N I Q D W C I S R Q L W W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
H R I P A Y K I I S S K L N S T E E I W V A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D E E T A I K E A I Q K Y G L S E C D F H V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D S D V L D T W F S S G L I P F S P L G W P D E
- - - - - D T W F S S G L I P F - - - - - - - -
---------------GATACATGGTTTTCATCTGGTTTAATACCATTT------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V N Q K T K L N D L S T F F P T T L L E T G S D
- - - - - - - - - - - - - - - - - L L E T G S D
---------------------------------------------------CTTTTAGAAACTGGATCAGAT
577578579580581582583584585586587588589590591592593594595596597598599600
I L F F W V A R M V M L S F A C T D K L P F K T
I L F F . V A R M V M L S F A C - - - - - F . T
ATATTATTCTTT---GTTGCGCGAATGGTCATGTTGAGTTTTGCTTGT---------------TTC---ACT
601602603604605606607608609610611612613614615616617618619620621622623624
I Y L H A M V R D S Q G R K M S K S L G N V I D
I Y L H - - - - - - - - - K M S K S - - - - - -
ATTTATTTACAT---------------------------AAGATGTCAAAATCA------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P I E I I E G I S L D D L N K K L D Q G N L P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Q E I K K S K E N N L K D F P D G I P E C G A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A L R I G L L A Y T K Q G R N I N L D T K R V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A Y R H F C N K L W N A C K F A F G N I E N V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N H M K Q N F E A I T I N E L F S N H S E D L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
W E D Y Y I L Y R L M V C I N C V K E S F D N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L F S D V V T A T Y N F W L Y E L C D V Y L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I K S R F K N I E S S F R Y A Y T A A Q V L S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
C I E Y G L V L L H P L T P F V T E E L Y Q R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K Q V T R S S I I S S I S T S E F P Q I F V H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G L I S S R D H E F K K M M N I V T K I R S L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A I L G I S N K D K I N I K V H V V Y N G T D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
E Y I D L I S N V A A A F V T K L S Q I G G T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
V L L N P S I D E I D E L K K N C L L D I V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
K T V Y Y L K P P E F V D L S I A L K K I E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
985986987988989990991992993994995996997998999100010011002100310041005100
I D S N V K S L E S Y N K K K S S S S Y D K V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
610071008100910101011101210131014101510161017101810191020102110221023102
E S V K K L N D E K I D Q L V S T I D A L R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
410251026102710281029103010311032103310341035103610371038103910401041104
H S N I E S L I N Q
- - - - - - - - - -
------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_ala_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q A D P K E Y Q L E F F R E K G F T R R R C H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V G G E Y F W T L N P E Q E H C N D A P C V E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y F W N L P K K V N D L S V A E A R R K F I R F
- - - - - - - - - - - - S V A E A R R K F I R F
------------------------------------TGCACCAATCTCTACCATTAATCCTTGTTCCACGGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F E R N G H E F I E P R P V V A R W R E D L Y L
F E R N G H E F I E . R P V V A - - - - - - Y L
TATTAGCGCAATTGTAATGCCATCAGGATC---TTGGCTTAGTAATTT------------------ATCATG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I A S I V V F Q P H V T S G V V P P P A N P L
T I A S I V V F Q - - - - - - - - - - - - N P L
GAGCGGCAGTTTATCTTTAACAACATA------------------------------------GATCCTCTC
121122123124125126127128129130131132133134135136137138139140141142143144
V I V Q P S I R L E D I D N V G L T L G R H L T
V I V Q P S I R L - - - - - - - - - - - - - - T
GGCTAATTGTTCGACTATATATCTCCG------------------------------------------TAG
145146147148149150151152153154155156157158159160161162163164165166167168
S F E M G G H H A F N Y P D K H V Y W K E E T V
S F E M G G H H A F - - - - - - - - - K E E T V
CTTCTCTACACGCTTCTCGAGCTCCGTGAC---------------------------GTTTACACGCTCCTC
169170171172173174175176177178179180181182183184185186187188189190191192
R L A F E F F T E E L G I P P E H I T F K E S W
R L A F E F F T - - - - - - - - - - - - - - - -
AAGCTCTGAGGCATAACGAGCAAC------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W E G G G N A G P S F E V T V G G L E L A T L V
- - - - - - - - - S F E V T V - - - E L A T L V
---------------------------TATCTCGGCAGTATTGGC---------GCCAAAGCACGCCTCTAC
217218219220221222223224225226227228229230231232233234235236237238239240
F M Q Y R V T D G G Y E P I P L R V V D T G Y G
F M - - - - - - - - - - - - - L R V V D T G Y G
ATCCCA---------------------------------------AACGCCACCTTGATATAGCCTAAATCC
241242243244245246247248249250251252253254255256257258259260261262263264
I E R L A W F T Q K V P T A F H A I Y G S L L D
I E R L A W F - - - - - - - - - - - - - - - - -
GTAGAGTTTCTCGGCCTCATT---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E F Y K L L G I E P A P R N L L W A A A R D A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R L D P E N P E S I K R F Y E R A A R D V G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P S E A E K L L R R E A A V Y A L L D H S K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A L M L A D G I V P S N T G E G Y L A R L V I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A I R L I K K L G S D V S L V E L V E R Q A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F W G N D Y Y P Q M L R N I D Y I L K V T R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E R Y R R S L E R G L R E V T R L L R R K R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S L D D L I V L Y D S H G L P P D M V A E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A K L G V K V D V P H N F Y A I V A E R H G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G G I A R R A E H P S L P Q D V V G W L K G F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A T E R L F H Q N P Y L R E F N A K V L G V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V Y L V L D R T A F Y P T G G G Q L H D T G V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R L C G E E Y Q V K R V E K V G D V I V H V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R E P R S N C S E A W G R I D W E R R Y R L M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
H H T G V H V I L G A A R R V L G E H V W Q A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A E K T P E K A R L D I T H Y E T P S P E E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R I E E L A N R A I L E R I D V E T K I M D R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E A E K L Y G F R L Y Q G G V P M T P K L R V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K I G D W D V E A C F G T H V A N T A E I G A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K I T R V E K L Q D G V I R L E L V A G S E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R Y A S E L E E R V N R V A N I V S G S V T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E K R V E K L I R D Y N N T R Q N L N K L R R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I V E Q L A E R I K K E P L T I D G I R I Y V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K D K L P L H D L Y Q E L T K L L S Q E D P D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I T I A L I P V E Q G L M V E I G A G S S A S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R V N L R E L A R L L S N K G F R G G G K P T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I N M L A R N V D E N E V L E V I I S A L R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917
I K E K P
- - - - -
---------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_ala_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L M E K Q T G E L D L K F F K N N G F E K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
C R V C G S Y F W T T D S R R E T C G D T P C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E Y T F I G N P P V P K K Y T L S E M R K A F F
- - - - - - - - - - - - - - T L S E M R K A F F
------------------------------------------GATCCTTGAAACTATGTCGATATCGCTTGT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D F F E K R G H K L L E P Y P V V P R W R E D V
D F F E K R G H K L L E . Y P V V P - - - - - -
TTCAGCTTCTATTGCAGGAATCTCCTTTTCCCCAAG---TATCGAGTTGGATTT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L L V N A S I Y D F Q P H V T S G I V K P P G N
L L V N A S I Y D F Q - - - - - - - - - - - - N
TAGTTTTGTACGGGCAGAGTCTAGATCTCTTTT------------------------------------ATC
121122123124125126127128129130131132133134135136137138139140141142143144
P I V M S Q P S I R M N D V D L V G V T G R H L
P I V M S Q P S I R M - - - - - - - - - - - - -
GCCAGCTTGATCTATGTTCTTTTTCGATATATT---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T S F E M L C H D A F N S K N D F V Y W K E E T
T S F E M L C H D A F - - - - - - - - - K E E T
CTCCAAAGCCGGAACACCTGCAACGAACGTTAT---------------------------TATCTTCTTTAT
169170171172173174175176177178179180181182183184185186187188189190191192
V R Y S Y E F L T D G L G I D G S L I T Y K E K
V R Y S Y E F L T - - - - - - - - - - - - - - -
CTTAAGCACACCTATCGACGATATATT---------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P W S G G G N A G N A L E V F V R G L E V A T L
- - - - - - - - - - A L E V F V - - - E V A T L
------------------------------AACGCCACCTTCAAAGAG---------ATACTTACCTATGGC
217218219220221222223224225226227228229230231232233234235236237238239240
V F M D M K E D Q E G E V E I E G T R Y T K M D
V F M - - - - - - - - - - - - - - - - - - - - -
CATATACCA---------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
M Q I V D T G Y G L E R L T W L S Q G T P T V Y
M Q I V D T G Y G L E R L T W L - - - - - - - -
CTTTTTGATGGTGTCCTCATCAATTCTTTTGTAGTGGGTTATGTCAAG------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q A I Y P E I I D Y V L E N S Y V E S I D N E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L S D V V R V S V M R E P Y D E A F V L S T L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K Y P N A L E R F E K A K K V R D I F V L I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H A R S L M H M F E A F V I P S N V K V G Y L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R L L I R R S I R A Q K N I G F K G S L I N L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E R N Y N E L K D I V K P L P I E F I K D V L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I E M Q K Y S E L E K R G Q Q V I E K I L K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K S I D I D D L V L L Y D S H G I S P D V V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
M A A E K G L K V M I P P N F H A M V I S R H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K S A L K K S A K V Y P N I E T R T L Y Y D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S T M R E F T G L V M Y S K G N E V I L D K T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F Y P E G G G Q P A D H G Y F E F K G K K I N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L D V Q K H G N A I V H K L D G E I P E G V R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K G V I D W E R R S R L M V H H T A T H L L L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V L R D I L G D H V W Q S G V Q K D V S E S H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D I T H Y K R I D E D T I K K I E H R I F E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T E G R P V S V K N L D W Y M A I G K Y G F R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F E G G V P L S P K V R V V E I E G V D A E G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G G T H L K N I S S I G V L K I K K I E A I Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N I Y R I T F V A G V P A L E L F E D S Y D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Y R V S N I S K K N I D Q A G D F V E N T V R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L S K I K R D L D S A R T K L I E E E I R K S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
S I K L G E K E I P A I E A E T S D I D I V S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I A H S K G I E V I I E S R V G T K F R Y T A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S P S G K S K Q I L H D L L H T D A E G N D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
S Y V I V D H K E L S I T R
- - - - - - - - - - - - - -
------------------------------------------
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_ala_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V K A N E N E Y R L N F F L S R G Y E R K I C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R S C S T P F W T L D K L K E N C S D V P C T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y Y F F D I N I K S P P L T V R E S R E K F L R
- - - - - - - - - - - - - T V R E S R E K F L R
---------------------------------------GCCTCTGATACTAATTACAATATTTTGATTGTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F F E K R G H T I V P P K P V V A K W R D D L Y
F F E K R G H T I V P . K P V V A - - - - - - Y
AGATGTGATCTTCCTCATTACTTCTTTTATAAG---TTCATCTATGAAGTC------------------AAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L T I A S I V D F Q P F V T S G L A K P P A N P
L T I A S I V D F Q - - - - - - - - - - - - N P
TCCATTGACGCTTATTCTCTCTGCAATCTC------------------------------------TAACAA
121122123124125126127128129130131132133134135136137138139140141142143144
L V V S Q P C I R L E D V D N V G I T F G R H L
L V V S Q P C I R L - - - - - - - - - - - - - -
ATTCTGCAAGTTCTCATGTTCTTCTAAATG------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T T F E M A A H H A F N Y P D K Q I Y W K D E T
T T F E M A A H H A F - - - - - - - - - K D E T
TAATTTCGAGATTTCATTTAATTTCTCGTCCTG---------------------------ACCAGCTACATA
169170171172173174175176177178179180181182183184185186187188189190191192
V A F A K E F F T E E L G I P E D Q L N F K E S
V A F A K E F F T - - - - - - - - - - - - - - -
TTCTAGTCTTATTACACCGTCTTGAAG---------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W W E G G G N A G P C F E V T V G G L E L A T L
- - - - - - - - - - C F E V T V - - - E L A T L
------------------------------ATCCCAATTTTCTATTTC---------TATCTCAGATCCTTC
217218219220221222223224225226227228229230231232233234235236237238239240
V F M Q Y E I R G Q D Y V P L K L K I V D T G Y
V F M - - - - - - - - - - - - - L K I V D T G Y
AGGTATTCC---------------------------------------AGTCCTCTCAATATATAGTGGTCT
241242243244245246247248249250251252253254255256257258259260261262263264
G V E R I A W F T Q R T P T A F H A I Y G N L V
G V E R I A W F - - - - - - - - - - - - - - - -
AACTTTTCTGCGGTCATTAATTAT------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G S F Y K K I G V S E V N N E L L K A A A I Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G R I D P D I K E T I T T H R E H L A K Q L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D L K Y V N E E L T R A A R V F Q V L D H T K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I A L M L A D G L V P S N S G E G Y L G R L L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R R A L R V L R L L G S D V K L H E L I K D Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y W K E D F P Q M L K N K N Y I I D A V I N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E K Y N D T I S K I P S I L S T L S K K S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D L D E L I N I Y D S N G I S P D L I L D E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K R N I N I S V E I P H N F Y S I V A K K H Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A L V R E N K K D K I P K E V I D E I N N K K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E P T V P L Y Y K D Q Y L R T F N A K V L L N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K N F L V L D Q T T F Y P E G G G Q I G D T G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I R S I E G N K Q V K V V D T Q K Y K G V I V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I L D K D S P F I Q G E Q V Y G E I D W Q R R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R I M K H H T V T H V I L S A T R K V L G E H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
W Q A G A E K T E Y K G R L D V T H Y K L P T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E E I R K I E D F A N Y I I N D R R K V R P L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
I E R T E A E M K Y G V S I Y A G G I P E G S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I R L I E I E N W D I E G C G G T H L I N T G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I G G V K I V N V E K L Q D G V I R L E Y V A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D M V S N Y A R Q Q D E K L N E I S K L L N S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I S Q I N V R L K K H L E E H E N L Q N L L D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
Y R K I L L D R I Q E I A E R I S V N G I T I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I L R D F I D E Q L I K E V M R K I T S N N Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I V I S I R G K D T K N V E I A T S K D I K V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K I V D E L R K I G G R G G G K G T Y G S V S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907
T V E E E K I I D T I K S A I T N G V
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_ala_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K W M K V D P S E F E L E F F E E I G F E R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R C P E C G E Y F W G P P E A E V C N E T P C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E Y S F I G D P P A S V K L D V W E A G E E F F
- - - - - - - - - - - - - - D V W E A G E E F F
------------------------------------------GACGTATGGGAGGCCGGAGAGGAGTTCTTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R F F E R H D H E V L D R Y P V V A R W R D D I
R F F E R H D H E V L D . Y P V V A - - - - - -
CGGTTCTTCGAACGGCACGATCACGAGGTCCTCGAC---TACCCCGTCGTCGCC------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H L T I A S I A C F Q P W V T S G E V P P P A N
H L T I A S I A C F Q - - - - - - - - - - - - N
CACCTGACTATCGCCTCGATAGCCTGCTTCCAA------------------------------------AAC
121122123124125126127128129130131132133134135136137138139140141142143144
P L V I N Q P C I R L N D I D N V G R T G R H F
P L V I N Q P C I R L - - - - - - - - - - - - -
CCTCTAGTGATCAACCAGCCCTGTATACGGCTC---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T L F H M G G H H A F N N H P H D R R D I Y W K
T L F H M G G H H A F - - - - - - - - - - - - K
ACGCTCTTCCACATGGGAGGCCACCACGCCTTC------------------------------------AAG
169170171172173174175176177178179180181182183184185186187188189190191192
E E T V R L C Y E F T V E K L G I P E E K I A F
E E T V R L C Y E F T V - - - - - - - - - - - -
GAGGAAACCGTGCGCCTGTGCTACGAGTTCACCGTG------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K E S W W E G G G N A G P C F E V V V D G L E L
- - - - - - - - - - - - - C F E V V V - - - E L
---------------------------------------TGCTTCGAGGTGGTGGTC---------GAGCTC
217218219220221222223224225226227228229230231232233234235236237238239240
A T L V F M Q Y E Q V G G E Y R E L P Q K I V D
A T L V F M - - - - - - - - - - - - - Q K I V D
GCGACGCTGGTGTTCATG---------------------------------------CAGAAGATCGTCGAC
241242243244245246247248249250251252253254255256257258259260261262263264
T G Y G I E R Y A W I T T G E P T A Y D A V F G
T G Y G I E R Y A W I - - - - - - - - - - - - -
ACCGGGTACGGTATCGAGCGGTACGCGTGGATA---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D L V D A T A R D L G V E I D G E A R E I L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L A R V A G L M D V E T E S D L R V L R N R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R L D L D V N E L V R V A E P V E F V Y G I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D H A R C L A F M L G D G V V P S N A G E G Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R L V I R R A L R L L D G L D A E R E Y L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V V E R V L E D L R G T Y P E L A E R E E Y I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D A L E C E I D R Y T R A L K R G K K E V R K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L E E K G E L S F E D L V E L Y D S H G I P P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V A R E I A E D E G V E V E V P D D F Y S R V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E R H E G P E E V E E G L E E L E R I A V E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L P E T E L A F Y D D E K R L E F K A E V I G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y E V N G D A W V V L D R T Y F Y P E G G G Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A D R G T M R W K D G E A E V K D V Q K V R G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V F H R I D G D V P P E G A E V E C E V D G E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R M R L T R N H T A T H V I L E A A R R V L G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
H V W Q A G A H K S T D E A R L D V T H H R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S D E E L R E I E R L A N E I V M K D L P V N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R F M D R N E A E R R Y G F E L Y Q G G V V P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R E I R V V E I E G W N V Q A C A G T H C D S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G E I G P I K I V G R E R I Q D G V E R I R F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
A G E A A L E R I W E T E D L L R E T C E V L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V N P E N L P K T V K R F F E E W K E Q R K R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E R L E R E L V E A K L R A A P A E G R R V G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
F T V T L V E L E D V E V G S V A G T V E E L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K E H E N L V L V A K I V S N G S C Q V V V G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G E S A P P A G E L M R E I G K L I E G G G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
D E R L A Q G G G R N P D G L T E D R L V E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918
E D L A G G
- - - - - -
------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_ala_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M E D E Y Q L E Y F K S E G L T R N I C S S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G K A F W T R N P D R M V C G D A P C E P Y Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I G N P I F R A K T V D E M R E A Y L S F F E K
- - - - - - - - - T V D E M R E A Y L S F F E K
---------------------------ACTGTAGATGAAATGCGGGAAGCATATCTCTCCTTTTTTGAGAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q G H T R I D R Y P V A A R W R D D I Y L T I A
Q G H T R I D . Y P V A A - - - - - - Y L T I A
CAGGGGCATACCCGGATTGAC---TATCCGGTCGCTGCA------------------TATCTGACAATTGCA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S I A D F Q P F V T S G V V P P P A N P L T I S
S I A D F Q - - - - - - - - - - - - N P L T I S
TCGATCGCAGATTTTCAG------------------------------------AATCCCCTTACCATCTCT
121122123124125126127128129130131132133134135136137138139140141142143144
Q P C I R L N D L D S V G R S G R H L T C F E M
Q P C I R L - - - - - - - - - - - - - T C F E M
CAGCCCTGTATCCGTCTC---------------------------------------ACATGCTTTGAGATG
145146147148149150151152153154155156157158159160161162163164165166167168
M A H H A F N S D E K E I Y W K D R T V E L C D
M A H H A F - - - - - - - - - K D R T V E L C D
ATGGCTCATCATGCCTTC---------------------------AAAGATCGCACGGTTGAGCTCTGTGAT
169170171172173174175176177178179180181182183184185186187188189190191192
Q L L T S L G A N K E M V T Y K E H P W I G G G
Q L L T - - - - - - - - - - - - - - - - - - - -
CAGCTCCTGACG------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N A G P S V E V L I G G L E V A T L V F M S L G
- - - - S V E V L I - - - E V A T L V F M - - -
------------AGTGTGGAGGTTTTGATA---------GAGGTTGCAACGTTGGTGTTCATG---------
217218219220221222223224225226227228229230231232233234235236237238239240
K Q K T E K P P I E L E G T P Y Y P M T L R I V
- - - - - - - - - - - - - - - - - - - - L R I V
------------------------------------------------------------CTTCGGATTGTC
241242243244245246247248249250251252253254255256257258259260261262263264
D T G Y G L E R F V W A S Q G S P T I Y D A V F
D T G Y G L E R F V W A - - - - - - - - - - - -
GATACGGGGTATGGACTTGAACGGTTTGTCTGGGCA------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P E M V S H V M Q E A G F G H R L H D S D F I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I L G E N A K F A G L M D I S G Q R I F E L R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K V A E K I G I P T D K L E K M I A P V E S V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A I V D H T R C L S Y M L G D C I V P S N A K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G Y L A R L V L R R T L R M M R E L D L P D E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L G D L I E R Q M K I I G L S K F E Q D P D V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M E I V D R E V D K Y R T T M E R G A R T V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L A Q T Y K K K C E K I P L D E I I T L Y D S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G I P P D M V K D L A T S Q G A V V D L P D D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y S R I A N M H S E S E Q I Q E K N P L F D Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R L A H L P E T R K L F Y E R P G S M E F E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K V L E I F D G Q Y V V L D Q T L F Y P E G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q P G D T G L F L T P D G L T V R V C D T I K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G E S I L H R I D G G N V R K G D M I R G I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E D R R L S L M R H H T A T H I L L H A A K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L G A H I H Q A G A Q K G E Y S S R I D I R H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K H I T P E E L K K I E V V A N R L V M A N S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T S I A W E D R T D A E Q K Y G F C L Y Q G G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P P G S R I R V V K V A G D I E A C A G T H C A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
H T G D I G T I S I I R V E H V Q D G V E R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
F A A G I A A I Q H K H H Q E D L L N R S A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F S V Q V E A L P A T S K R F F D E W K E Q R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E I E K L S S R I S E L E S K N L E T V D Y N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I S V L V K R L D L P N P E L V K V A T G I S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K G G I A I L V A G G E T A R V V V S S G Q K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V K A G D V I S T V C A V L G G K G G G K P T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A Q G G G P D V S K I D D A L A A G E S F I K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916
A L H V
- - - -
------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_ala_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I T M S H Q L E K L G Y R K Y E C R S C G N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F W S M K E R A T C G D A P C D E Y G F I G N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A T D R S Y D L Y E I Q D K F M E F F A E R G H
- - - - - - D L Y E I Q D K F M E F F A E R G H
------------------GACCTCTATGAGATACAGGATAAATTCATGGAGTTCTTCGCCGAAAGGGGCCAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E P I R R Y P V L A K R W R D D V F L V G A S I
E P I R . Y P V L A - - - - - - - F L V G A S I
GAACCCATCAGG---TACCCGGTACTTGCA---------------------TTCCTTGTCGGGGCATCAATA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y N F Q P W V T S G L V K P P A N P L V V A Q P
Y N F Q - - - - - - - - - - - - N P L V V A Q P
TACAACTTTCAA------------------------------------AACCCCCTCGTGGTTGCGCAGCCA
121122123124125126127128129130131132133134135136137138139140141142143144
S I R L N D V D N V G R T G R H L T C F T M G G
S I R L - - - - - - - - - - - - - T C F T M G G
TCAATAAGACTC---------------------------------------ACATGCTTCACAATGGGGGGT
145146147148149150151152153154155156157158159160161162163164165166167168
H H A F N S E D N T V Y W E E E T I K Y C H D F
H H A F - - - - - - - - - E E E T I K Y C H D F
CATCATGCATTC---------------------------GAAGAAGAAACCATAAAGTACTGTCATGACTTT
169170171172173174175176177178179180181182183184185186187188189190191192
L T H I G I D P S E I T F I E S W W Q G G G N E
L T - - - - - - - - - - - - - - - - - - - - - -
TTAACA------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G P C Y E V C V R G V E L A T L V F I Q Y R T L
- - C Y E V C V - - - E L A T L V F I - - - - -
------TGCTATGAGGTATGCGTC---------GAACTTGCAACCCTCGTCTTCATA---------------
217218219220221222223224225226227228229230231232233234235236237238239240
P D G G R E E I P L K I V D T G Y G L E R F A W
- - - - - - - - - L K I V D T G Y G L E R F A W
---------------------------CTCAAGATAGTTGACACAGGCTATGGCCTTGAAAGGTTCGCCTGG
241242243244245246247248249250251252253254255256257258259260261262263264
I S Q G T P T A Y D A C L G P V I E K L V E L T
I - - - - - - - - - - - - - - - - - - - - - - -
ATA---------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G V K I D E E I L A E N A Q V A G M M D I E T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A D L R E L R K R V A D K L G I S V E E L E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A A P M E S V Y A I A D H T R C L A F M L A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I P S N V K E G Y L A R L I I R R T L R L M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L G M K E S L K D I M N I Q V E F L E G H Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I R S H H E H I L N I I D L E E H R Y A R T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K R G R R I V E K T I K Y L K R D G K A E M P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E I L I K L Y D S H G I P P E T I G E I A E E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G F Q V K I P D N F Y T L V A E R N E T E T E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P E E D V H L D Y P A T E L L F Y D E P D D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F Q A E V I G I H E N G L I L D R T L F Y P E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G G Q P S D T G Y I T A E G C R L R I K H A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I G A V V V H R T D D E I C I E P G T T I R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I D S D R R L Q L T R N H T A T H L I V S A A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K V L G D H I W Q A G A Q K G V K S S R L D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
H Y R R I T L E E L Q E I E R L A N E Y V M M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V P L K V R W M D R D L A E R K Y G F I L Y Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G V V P G S R I R V V E I P G V D V Q A C A G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H V H R T G D I G L I R I N R T E R I Q D G V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R I E F S A G S A A I E I M Q K T G D I L R E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S D I F K V T P S Q L P G T C E R F F T E W K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L R N E V S R L K E K V A S L K I L E M K D R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E R I N D L T V I I D T V D A D M D E M K N M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L E L S A T V D A V V L A N P E G K I V G A A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E D A V K A G L R I N E V I S Q A A A V L G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G G G R P H L A Q G A G P A T D K V D E A L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898
A R A A L S T V R N
- - - - - - - - - -
------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_ala_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E I K H D Y N V Q L F K E K G F I R K Q C K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
C N Q Y F W T L D P K R E T C G D S P C D E Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F I G S S I T N K E Y T Y N E M V K E F L N F F
- - - - - - - - - - - T Y N E M V K E F L N F F
---------------------------------AATAGAATTATCCTTTTCATTTACTAAATTATCGGCAAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K N G H T P I K R Y P V S A R R W R D D I L L
D K N G H T P I K . Y P V S A - - - - - - - L L
AGACATTAACTCCTTAGGAGCTCCCTC---TTTTTCAACCAATAA---------------------AAATTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I A S I A V F Q P W V T K G I V K P V A N P L
T I A S I A V F Q - - - - - - - - - - - - N P L
ATCATTGAGATTTCCTTTTTCCAATTC------------------------------------TTGTTCCTT
121122123124125126127128129130131132133134135136137138139140141142143144
V I A Q P C I R L N D I D N V G R T G R H M T C
V I A Q P C I R L - - - - - - - - - - - - - T C
CCATTCTTCGAAAAATCTATTTACGGT---------------------------------------GGCATT
145146147148149150151152153154155156157158159160161162163164165166167168
F T M G G H H A F N T D E D F K Y W T D R T V E
F T M G G H H A F - - - - - - - - - T D R T V E
TAATAAAATATCCTCCATCAGACTTAC---------------------------ATATTCCAATCTTTCTAC
169170171172173174175176177178179180181182183184185186187188189190191192
L C Y N F F T N L G I D G S S I T F I E S W W E
L C Y N F F T - - - - - - - - - - - - - - - - -
TCCATCTTGAATTCGTTCTGT---------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G G G N A G P C Y E V I T H G V E L A T L V F M
- - - - - - - C Y E V I T - - - E L A T L V F M
---------------------GCCCTCAATATCCAATAT---------ATTTCCTGGAACTACTCCTCCCTG
217218219220221222223224225226227228229230231232233234235236237238239240
Q Y E K T E Q G D Y I E M P L K I V D T G Y G L
- - - - - - - - - - - - - - L K I V D T G Y G L
------------------------------------------CATAACCGTAGATTTGACTGGTATGGCATC
241242243244245246247248249250251252253254255256257258259260261262263264
E R F V W A S K G T P T V Y E A V F G D I I G K
E R F V W A - - - - - - - - - - - - - - - - - -
CAATACTATTTGATTTGC------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L M D D A N I N M N D I G P K I L A E S A T L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L M D I E N V G D L R I L R Q K V A E K L N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D V N E L D S I L S P I E N I Y A I A D H T R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L A F M L G D G I V P S N V K D G Y L A R L L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R K T L R Y I K N V G L S L S L K D I V A M Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E N L K E I Y P E L M D M K E Y I M D V L E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E N K Y I Q T I T K G K G A V E R I A K S K D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I T L D D L I E L Y D S K G L P P E V V R D I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E E I N K K G S K N N K G N K T I K I T V P D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F Y T I V A E R H E E K K E D S K S E K G E N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A E K S T I S I N L D D I P E T E L L F Y S N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y Q K E V E A K I L K I I G N V V I L D K T V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y P E G G G Q K Y D I G L I G N K K I I S V Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N N N G I V C H T V E N T D G L N E E D T I I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K L N W E N R L N L M R N H T A T H I I N A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S K V L G K H I W Q T G S N V E S N K A R L D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T H Y K R I T R E E I K E I E K I A N Q I V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
A I P V K S T V M G R N E A E Q K Y G F K I Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G G V V P G N I L R I L D I E G V D V E A C G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T H C Q N T S E V G Y I K I L K T E R I Q D G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E R L E Y T S G I N S V N E V S L M E D I L L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A S S I V G V P C E N L P K T V N R F F E E W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E Q K K I I E E L H K K I G E L E K G N L N D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
F E K V G K Y D L L V E K V E G A P K E L M S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A D N L V N E K D N S I V I L L N N S G Y I L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K C G E K V E I K M G E L L R K I A K G G G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910
K M A Q G K C A D D I E T L K S K V V G E L
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_ala_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L E D E Y Q L D F F K N N G F V R K Q C Q K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G K F F W T R D P E R N T C G D A P C D P Y S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I G S P V F S R E F N I S E M R E Y Y L S F F E
- - - - - - - - - - N I S E M R E Y Y L S F F E
------------------------------AATATTTCAGAGATGCGCGAATACTACCTCTCCTTCTTTGAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A R G H T R L D R Y P V V A R W R D D I Y L T I
A R G H T R L D . Y P V V A - - - - - - Y L T I
GCAAGAGGGCATACAAGGCTTGAC---TATCCTGTGGTAGCC------------------TACCTGACCATT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A S I A D F Q P F V T S G Q V P P P A N P L T I
A S I A D F Q - - - - - - - - - - - - N P L T I
GCTTCAATCGCAGACTTCCAG------------------------------------AACCCCCTGACGATT
121122123124125126127128129130131132133134135136137138139140141142143144
S Q P C I R L N D L D S V G R S G R H L T N F E
S Q P C I R L - - - - - - - - - - - - - T N F E
TCCCAGCCCTGCATCAGGTTA---------------------------------------ACTAATTTTGAA
145146147148149150151152153154155156157158159160161162163164165166167168
M M A H H A F N K R G N E I Y W K E H T L E L C
M M A H H A F - - - - - - - - - K E H T L E L C
ATGATGGCTCATCACGCTTTC---------------------------AAGGAACACACTCTGGAACTCTGC
169170171172173174175176177178179180181182183184185186187188189190191192
D E L L T S L K V D P F A V T Y K E E P W A G G
D E L L T - - - - - - - - - - - - - - - - - - -
GACGAGCTCTTAACC---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G N A G P C V E V I V H G L E L A T L V F M D L
- - - - - C V E V I V - - - E L A T L V F M - -
---------------TGTGTTGAGGTTATCGTG---------GAGCTTGCGACCCTTGTTTTCATG------
217218219220221222223224225226227228229230231232233234235236237238239240
K T D K K G D I L I K G E T Y S K M D N Y I V D
- - - - - - - - - - - - - - - - - - - N Y I V D
---------------------------------------------------------AATTACATCGTGGAT
241242243244245246247248249250251252253254255256257258259260261262263264
T G Y G L E R F V W A S K G S P T I Y D A L F P
T G Y G L E R F V W A - - - - - - - - - - - - -
ACCGGCTACGGTCTTGAGCGTTTTGTCTGGGCT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I V N E L M G L A G L E H E L N N T E Y S N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L A Q N A R L A G F M D V S E K A N L L E L R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K V A S S I G M T V D K L S V I M E P V E K V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A I T D H T R C L T F M L G D G I I P S N V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G Y L A R L V L R R T L R M M K D L D I R T P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S E I V D M H I R N M P E Y P E F R A N F P V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q D I L E S E E E K F N I T M E R G R R I I Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S A S H F K K T G E K I P L S Q L T E L Y D S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G I P P E M A K E V A A D I G V G V E F P D N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y S I I G E L H N K A E E K E E E V I P F A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L K H L P K T K R R F Y D E P T R L E F E A V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L D V F D N H I V L D N T F F Y A E G G G Q P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D I G T I S V G D I V Y K V V D V Q V Y E G V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V H T V D I P D G E L E I T K G D I I T G K V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E R R R M T L A R H H T A T H I V N D A A R K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L G K H I W Q A G A Q K F E D H S R L D L S H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K H I S P E E L K Q I E L L A N R T V M E N K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V I T E W M P R I E A E Q V Y G F G L Y Q G G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P P G E K I R I V K V G D D V E A C G G T H C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S T G V I G P I K I L K T E R I Q D G V E R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
F A A G I A A V R A M Q K M E S L L V D S A K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L S V P P E H L P V S V E R F F G E W K D L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E N E R L K E D L A R S R V Y R M L G D A S E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A G L R V V S E Q V P G A D S L E L Q K I A T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L L K Q E N V V T L L A S D L E G V K L V A S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G E K A I E C G I N A G N L V R E M S K I V G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
G G G G K P A L A M G G G T D P T R I Q D A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925
R G L E L V K E A C K E A
- - - - - - - - - - - - -
---------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_ala_aa
Archaea/Staphylothermus marinus/Smarinus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E E E F M N E F L K K T G Y Q V Y K C K K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G E R F W S L V P R D T C P D R P C S K Y D F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y N E Y K G V P P L T F D E A R R K F I E F F T
- - - - - - - - - - T F D E A R R K F I E F F T
------------------------------ACATTTGATGAAGCAAGAAGGAAATTCATAGAATTCTTTACC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S H G H G Y V D P Y P V L A R W R N D L Y L T I
S H G H G Y V D . Y P V L A - - - - - - Y L T I
TCTCATGGACATGGATATGTTGAC---TACCCAGTTCTTGCT------------------TATTTGACAATT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A S I I V F Q P A V T E G I V D P P Y N P L V I
A S I I V F Q - - - - - - - - - - - - N P L V I
GCGTCAATAATTGTTTTTCAA------------------------------------AATCCGCTAGTCATA
121122123124125126127128129130131132133134135136137138139140141142143144
V Q P S V R L E D I D N V G L T F G R H L T S F
V Q P S V R L - - - - - - - - - - - - - - T S F
GTTCAGCCCAGTGTTAGGTTG------------------------------------------ACAAGTTTT
145146147148149150151152153154155156157158159160161162163164165166167168
E M G G H H A F N K K D Q Y V Y W V N E T L Q Y
E M G G H H A F - - - - - - - - - V N E T L Q Y
GAAATGGGAGGACATCACGCATTT---------------------------GTAAACGAAACACTTCAATAC
169170171172173174175176177178179180181182183184185186187188189190191192
A F D F F T K I I G I E P E N I V F K E S W W E
A F D F F T - - - - - - - - - - - - - - - - - -
GCATTCGACTTCTTTACA------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G G G N A G P A Y E V L V D G L E L A T L V F M
- - - - - - - A Y E V L V - - - E L A T L V F M
---------------------GCATACGAGGTTCTAGTT---------GAGCTTGCCACACTAGTATTTATG
217218219220221222223224225226227228229230231232233234235236237238239240
K Y K I V N G K K V R N P V L V V D T G Y G I E
- - - - - - - - - - - - - V L V V D T G Y G I E
---------------------------------------GTACTCGTAGTTGATACTGGTTATGGTATAGAG
241242243244245246247248249250251252253254255256257258259260261262263264
R I A W F T Q R T P T A F H T I F S S L L E T Y
R I A W F - - - - - - - - - - - - - - - - - - -
AGAATTGCCTGGTTT---------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K N I L G I D E P P Y D V L K K I V Y L L S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E I E D V Y M L N K Y L E E I D Y S E Y Y K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V D T I N L Y T A L D H V K T L S L M L S D G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V S S N T G E G Y L A R L V I R R L L R T L I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L G I K V S T L E D I V L E L I D K Q A K Y W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G R Y V Y D K F H R R L D Y I L D V M S Y E T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K Y I D I V T R G I R E V D R F I K K K K K I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F D D L I Q I Y D S K G I P P E I V V E R A K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Y G Q E I R V P S N F Y S L I A A R H G G S Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L I K E K E H E L P D E I V E W A S K H D P T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K L F H E N P Y L R R A S A K V L D S L N E Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I F D Q T I F Y P R A G G Q D H D K G Y V I L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
N E H I P V K H V Y K V G E V I V H Q L A T K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R L V P G T Q V E L V I D W Y N R Y R L M R H H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T A T H I V L G A A R K V L G E H V W Q A G A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K T V E K A R L D I T H Y K S L S D E E I R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E E L A N K V I D E R I D L K F Y F L P K F E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E K R F G L R I Y Q G G A V Y S P I L R I V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P G W D A E A C F G T H V Y N T S E I G G I K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I K A E K I Q D G V I R L E Y I A S T R L P E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
I S D L Q K E V D K A L K F L G A K G L P I S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
V A K K V S E E L D K Y K T L L I Q Y R R L F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E I L L K H L L E E A L E I C G L K T V V I E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
Q L E D E Q L Y K S I I E D L S L K K R V L T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Y V S D K F V E I A I H P D E A N N R K L D L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K L V E I L Q N M G G R G G G K P D H I Y I K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909
K E P K Q I V K L I V E A I T N L L C K A
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_ala_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K H N Y K V K L F D E L G F V R K K C K K C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q W F W T L D E E R E T C G D A P C D I Y S F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G K P I T K K P Y T Y K E M V K E F I N F F K E
- - - - - - - - - T Y K E M V K E F I N F F K E
---------------------------ATTCAATAACACAACTATGGCATTTTCAGTAGCTAAGTTATCAGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H G H E P I K R A P V T A R R W R D D I L L T I
H G H E P I K . A P V T A - - - - - - - L L T I
TATGTTCAACATCTCTTTTGG---AGCCTCAACTTTCTC---------------------AATTGTCTCAAA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A S I A V F Q P W I T K G I V K P K A N P L V I
A S I A V F Q - - - - - - - - - - - - N P L V I
TTTATTTATTAATTCAAATTT------------------------------------CTTCTTTCTCTGCTC
121122123124125126127128129130131132133134135136137138139140141142143144
A Q P C I R L N D I D N V G R T G R H L T C F T
A Q P C I R L - - - - - - - - - - - - - T C F T
CTTCCACTCTTCAAAGAATCT---------------------------------------AATCTCAGCACT
145146147148149150151152153154155156157158159160161162163164165166167168
M G G H H A F N R E D D F K Y W Q D E T V E L C
M G G H H A F - - - - - - - - - Q D E T V E L C
CTCCTCTAATATATCCTCCAT---------------------------GCCACTTGAATAAATCAGCCTTTC
169170171172173174175176177178179180181182183184185186187188189190191192
F N F F K K L G I D E K S I T F I E S W W E G G
F N F F K - - - - - - - - - - - - - - - - - - -
AACACCATCTTGAAC---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G N A G P C Y E V I T H G V E L A T L V F M Q Y
- - - - - C Y E V I T - - - E L A T L V F M - -
---------------AACATCAACGATATTTCC---------TTCAATAATAACAATCCTTAAAAC------
217218219220221222223224225226227228229230231232233234235236237238239240
E K V G D N Y K E I P L K I V D T G Y G I E R F
- - - - - - - - - - - L K I V D T G Y G I E R F
---------------------------------AAATTTCTCCTCTGCCTCATTTCTATCCATAAATATACT
241242243244245246247248249250251252253254255256257258259260261262263264
V W A S T G E P T I Y D A I F K N I V N K L K E
V W A - - - - - - - - - - - - - - - - - - - - -
CTTTATGTT---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D A G V K D I D K E I L A K I T E V A G L M D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D V G D L R K L R E E V A N K V N I P V E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D K L I S P Y E D I Y A I V D H T R A L A F M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G D G I V P S N V K D G Y L V R M L I R K T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H M D R L N L S T P I T E I V A M Q L N E L K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L Y P E L L D M E D Y I M E I L E I E T N K Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q T I E R G K G I V E R L L K S K K E I D L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L I E L Y D S H G L P P E I V K D V A K S L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D V K I P D N F Y T I V A E R H E N K K E V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K I K L P E V N V D K T E L L F Y E Y P K M K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F E A K I L R I V D D Y V I L D R T A F Y P E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G G Q K A D T G Y I I K G D K K F R V V D V Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E N N I V Y H K I E N L N D E L K E G D I V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V I D W K R R L S L M R N H T A T H I I N A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q K V L G R H V W Q A G S D V D V D K A R L D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T H Y K R I S R E E L K D I E R V A N E I V L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
N Y N I K S I F M D R N E A E E K F G F R I Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G G V V P G N V L R I V I I E D E N G N I V D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Q A C G G T H C Q N T G E V G F I K I I K T E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V Q D G V E R L I Y S S G L S A L K A V Q E M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D I L E E S A E I L R C P T E E L P K V I K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F E E W K E Q R K K I E E L E K K I G E L K K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E L I N K F E T I G N Y K V L V E K V E A N P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E M L N I A D N L A T E N A I V V L L N D K G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I L C K R G E N V D I K M N E L I R Y I A K G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G R E H L A Q G K Y E G D V E E I K K K V I E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892
I K N K
- - - -
------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_ala_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H V D P K E Y E L E F F K E K G F I R R R C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I G G E Y F W T L N P E Q E H C N D A P C V E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y F W D V P K R S T D L S V A E A R R K F L R F
- - - - - - - - - - - - S V A E A R R K F L R F
------------------------------------GGAGGCCTTGGAGCCGGCGCCAACCTCTACCACAAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F E R N G H E I I E P R P V V A R W R E D L Y L
F E R N G H E I I E . R P V V A - - - - - - Y L
ACCCTGCTCAACTGGCACCAGCGCTACTGT---GCCCTCCGGGTCCTC------------------AGCCTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I A S I V V F Q P H V T S G I V P P P A N P L
T I A S I V V F Q - - - - - - - - - - - - N P L
CTGGTAGAGTTCGCGGAGGGGGATATC------------------------------------CAGTGGGCT
121122123124125126127128129130131132133134135136137138139140141142143144
V I V Q P S I R L E D I D N V G L T L G R H L T
V I V Q P S I R L - - - - - - - - - - - - - - T
GCTCTTAGCCTTCTCCACCATATCCTT------------------------------------------ATT
145146147148149150151152153154155156157158159160161162163164165166167168
S F E M G G H H A F N Y P D K R V Y W K E E T V
S F E M G G H H A F - - - - - - - - - K E E T V
GTAGTCGCGTATAAGCTTCTCTACGCGCTT---------------------------CATCCTGGCTATATT
169170171172173174175176177178179180181182183184185186187188189190191192
R L A F E F F T E E L G I P P E H V T F K E S W
R L A F E F F T - - - - - - - - - - - - - - - -
GTTTAGGCGGCTCTCCAGCTCGGA------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W E G G G N A G P S F E V T V G G L E L A T L V
- - - - - - - - - S F E V T V - - - E L A T L V
---------------------------TATCTTGACGGAGCCTAT---------GTTGGACACATGTGTGCC
217218219220221222223224225226227228229230231232233234235236237238239240
F M K Y R V V D G R Y E P I P V K V V D T G Y G
F M - - - - - - - - - - - - - V K V V D T G Y G
GAAGCA---------------------------------------CTTAGCCGACATGGGGACGCCGCCCTG
241242243244245246247248249250251252253254255256257258259260261262263264
I E R I A W F T Q R V P T A F H A I Y G S L L E
I E R I A W F - - - - - - - - - - - - - - - - -
ATATAGGCGGAAACCATAGAC---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D F H K L L G V E P P P S K L L W A A A R D A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R L D P E D P E S V R R F Y E R A A R D A G M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P R E A E E L L R R A A A V Y A L L D H S K T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A L M L G D G I V P S N T G E G Y L A R L V I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A L R L I R R L G S D A S L V E L V E R Q A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F W G R D Y Y P R M L E N L D Y I V K V T R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E R F D R S I E R G L R E V A R L L R R K K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S L D D L I L L Y D S H G L P P D M V A E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A K L G V R V H V P H N F Y A I V A R R H G A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G G V A R R S E K P S L P E D V V E W L R G F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E T V R L F H E D P Y M R E F T A R V L G V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V Y L V L D R T A F Y P T G G G Q L H D T G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R L C G E E Y R V V R V E K V D G V I V H V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R E P P G G C S E A W G R I D W E R R Y R L M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
H H T A V H V L L G A A R R V L G N H V W Q A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A E K T P E K A R L D I T H Y E L P S S E E V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R I E E L A N K A I L E R I P V E A R I M D R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E A E K V Y G F R L Y Q G G V P M S A K I R V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R I G D W D V E A C F G T H V S N S A E I G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
K I T R V E K L Q D G V V R F E L V A G S E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R Y A S E L E S R L N N I A R M V G G G A A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E K R V E K L I R D Y N K T R Q S V N I L S K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V V K D M V E K A K S S P L A I D G L R V Y V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
R D D I P L R E L Y Q E A A K Q L S L E D P E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V T V A L V P V E Q G V V V E V G A G S K A S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
R V D L R Q L A R L L A S R G F R G G G K P S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
V T M M A R G L S A E E A L D A L L S A L R S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922
V E G K G G S G T G
- - - - - - - - - -
------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_ala_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q K L T A A Q I R E T F I S F F K R H G H T H
- - - - T A A Q I R E T F I S F F K R H G H T H
------------TTCGGCCAACACGTCTACCGCAGCAGTGATAGCAGCCGCCAAGCGGTCGGGGGTCCGTCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V P S S S L V V A D D P T L L F A N S G M V Q F
V P S S . L V V - - - - - - L F A N S G M V Q F
ACCGGCTTGCGC---TTCCGGTCG------------------GACGATAGCGGCAAGCGGTTTGACAATATG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K D V F L G R E Q R P Y T R A V T A Q K C L R V
K - - - - - - - - - - - T R A V T A Q K C L R V
CAC---------------------------------AACAATTGTAAGTAATTGCGGTTTACCGTTGATCTG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S G K H N D L E E V G P S P R H H T F F E M L G
- - - - - - - - - - - - - - - - - T F F E M L G
---------------------------------------------------CATCTCACGCAGGCGTTCGAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N F S F G D Y F K A E A I R L A W K L L T E E F
N F S F - - - - K A E A I R L A W K L L T - - -
CGAATCGGCTTC------------CAGCAGCGGAATCCCGGCGACCGTTTGCGTGCGATGTAC---------
121122123124125126127128129130131132133134135136137138139140141142143144
Q L P V E R L W F T V F A G D D E V P P D D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A A L W I A Q G A D P S R V L R F G R K D N F W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V M G D T G P C G P C S E I T I Y I G D D L S Q
- - - - - - - - - - C S E I T I - - - - - - - -
------------------------------CCCGGTCAGAGCCTCAAC------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M R A E G V N S D D P N Y V E I W N N V F M Q Y
- - - - - - - - - - - - - - E I W N N V F M - -
------------------------------------------ATTCACGTGTGTGCCACCGCACAG------
217218219220221222223224225226227228229230231232233234235236237238239240
D R A T M Q P L P R P S V D T G M G L E R M A M
- - - - - - - - - R P S V D T G M G L E R M A M
---------------------------CTCAATTCCGGTACCGCGTTCAATGGTCACGACGCGCACGGTATC
241242243244245246247248249250251252253254255256257258259260261262263264
V M Q G V H S T Y D T D L F V S I I N R I I A V
V - - - - - - - - - - - - - - - - - - - - - - -
ACC---------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R G S D E E H Y Q A H R S A Y R A I A D H S R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I A F L I A D G V L P G N L G R P Y V L R R I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R A A Y Q G R T I G F E R P F L A E V I T T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I D Q M G E V Y P E L V N R R E L I L S A A D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E E R Q F L R T L S G G L S R L N A V I E Q V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T R G E T V I P G T D A F V L K D T Y G F P L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L T Q K I A A E Q G L T V D E A G Y E A A M A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q R A R S R A A A A G K R G G E A D L W A E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L P A S H F T G Y E R L S D R A T V I G M L A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G D A I T S A M V G R Q V Q I V L D T T P F Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E S G G Q V G D T G V L V G P E G S V Q I E D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R R P L P G L I V H Y G R V V S G T I H V G D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V Q A T V D M V R R A D I Q R N H T A T H M L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R A L R D V L G E H A A Q A G S L V A P D R L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
F D F T H T K P L D P E E L R E I E R R L N A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
V R A D A S V R W E I T G Y R S A I A R G A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L F G E K Y G D T V R V V T I E R G T G I E N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E Y A S R D S L E L C G G T H V N R T G E I G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V R I L G E G S I G S G I R R V E A L T G R G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
E L W A E E Q A Q T L R D L A A R I N A Q P A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L I E R I E A L L A E N R Q R R Q E L E A L R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K L A R E M L D T L V H R T Q T V A G I P L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A E V E A D S V E R L R E M G E Y L R D K L G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
A V I V L G A Q I N G K P Q L L T I V T S D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K R G L N A V H I V K P L A A I V G G G G G G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
P E I A Q A G G R T P D R L A A A I T A A V D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894
L A E Q V G
- - - - - -
------------------
Class II
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_ala_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P E P S A K D V R Q Q F L D F F A Q K H G H K
- - - - S A K D V R Q Q F L D F F A Q K . G H K
------------TCCGCCAAAGACGTCCGCCAGCAGTTCCTCGACTTCTTTGCGCAGAAG---GGGCACAAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V V P S A P V V P H G D P T L L F A N A G M N P
V V P . A P V V P - - - - - - L F A N A G M N P
GTCGTGCCC---GCGCCGGTGGTGCCC------------------CTGTTCGCCAACGCGGGCATGAACCCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F K P Y F L G E E V A T D K R V C D T Q K C I R
F K - - - - - - - - - - - K R V C D T Q K C I R
TTCAAG---------------------------------AAGCGGGTCTGCGACACCCAGAAGTGCATCCGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A G G K H N D L E D V G R D T Y H H T F F E M L
A - - - - - - - - - - - - - - - - - T F F E M L
GCC---------------------------------------------------ACCTTCTTCGAGATGCTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G N W S F G D Y F K K E A I R W A W E L L V D V
G N W S F - - - - K K E A I R W A W E L L V - -
GGCAACTGGAGCTTC------------AAGAAGGAAGCGATCCGCTGGGCGTGGGAGCTGCTCGTC------
121122123124125126127128129130131132133134135136137138139140141142143144
W G L E P E R L H A T Y F E G D E A E G L E P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L E A R D L W L Q L L P A E R V H P G N K K D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F W E M G D T G P C G P C S E L H Y D G T A D L
- - - - - - - - - - - - C S E L H Y - - - - - -
------------------------------------TGCTCGGAACTCCACTAC------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S G A A K V N A D D P D V I E I W N L V F I Q F
- - - - - - - - - - - - - - E I W N L V F I - -
------------------------------------------GAGATCTGGAACCTGGTCTTCATC------
217218219220221222223224225226227228229230231232233234235236237238239240
N R S T T G K L E P L P A K H V D T G M G F E R
- - - - - - - - - - - - A K H V D T G M G F E R
------------------------------------GCGAAGCACGTCGACACGGGCATGGGCTTCGAGCGG
241242243244245246247248249250251252253254255256257258259260261262263264
I V R V L Q G H S S N Y D T D V F T P L F E A I
I V R V - - - - - - - - - - - - - - - - - - - -
ATCGTCCGCGTG------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R E A T G A G P Y T G E L E K P E D V A Y R V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A D H I R T L V F A L A D G A H C D K D G R G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L R R I L R R A V R Y G R Q T L G Q E Q P F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F E L V P A V V A N F G D A F P E L R E R A D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V A A E I R E E E E S F S K T L G R G I Q L F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L S A R R V E E A A G R G G G K T I A A T D A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q L H D T Y G F P L D L T E L M A A E R G M T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D A E G F D R L M G E A R V R S R G G G D G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A A A M A S L R E E V Q R G F D A G W Y A G T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F T G F E T A E A P F Q Q N Q I H V F R R Q D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H W L S L T A G E S A T A G D A V A I V L K M S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P F Y A E M G G Q V G D T G S I Q L R T G G R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A V R D T Q K V G A V H V H L G E V V S G E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T D P D V I L A V A V D L E R R R A I E A N H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
A T H L L N R S L R D R V S D D V Q Q R G S L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E A E R L R F D F N H G A A L G D D E L A A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G D L A A A I A A R R G V F S G N A P E A Q A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G I R G L R A V F G E K Y P P V V R V V S V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P V D K L L A D P D N A A W E E L S V E L C G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
T H A G N T A D L G A F A L V G Q E A V G K G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
R R V T A V T G E P A V A A R E E A A R L M K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L D A A A G L D P E A V A A Q L D G L T K R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A A T L P L A E R A A T R A K L A T L G E A V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K H R K E A G A Q A T D A V L D A A R A A A E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V A D G A V L V T G I D G A D G K S L R V A M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
V V N K L R P Q S P A M L A A T E D G K V S L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
A S V P K D K V Q A G W K A G E W V N A A A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
V G G R G G G K P D R A Q A G G K D P A K L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949
A L D A A R A W T A D R G
- - - - - - - - - - - - -
---------------------------------------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_ala_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P P K Q Y G M M G L I C S L S F I S L R Q S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A P A L S G D Q I R E T F L K F F E G K G H R
- - - - - S G D Q I R E T F L K F F E G K G H R
---------------AGCGGTGATCAAATCCGCGAAACCTTTCTGAAATTCTTTGAAGGCAAGGGGCACCGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L P S A S L I P E D P T V L L T I A G M L P F
R L P . A S L I P - - - - - L L T I A G M L P F
CGCCTACCC---GCCTCGCTGATCCCT---------------TTGCTGACGATCGCAGGCATGTTGCCGTTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K P I F L G Q Q V A E V P R A T T S Q K C I R T
K - - - - - - - - - - - P R A T T S Q K C I R T
AAG---------------------------------CCACGGGCCACAACGTCGCAAAAGTGCATTCGCACC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N D I E N V G R T A R H H T F F E M L G N F S F
- - - - - - - - - - - - - T F F E M L G N F S F
---------------------------------------ACCTTCTTTGAAATGCTGGGCAACTTCAGCTTC
121122123124125126127128129130131132133134135136137138139140141142143144
G D Y F K K E A I A F A W E L V T E V F Q V P A
- - - - K K E A I A F A W E L V T - - - - - - -
------------AAGAAAGAAGCGATCGCCTTTGCTTGGGAACTCGTCACG---------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E R L A V S V F E E D D E A F A I W R D Q I G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P E A R I Q R L G A K D N F W A S G P T G P C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P C S E I Y Y D F H P E L G N D G L D L E D D S
- C S E I Y Y - - - - - - - - - - - - - - - - -
---TGCTCCGAGATCTATTAC---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R F I E V Y N L V F M Q Y N R D A A G N L T A L
- - - E V Y N L V F M - - - - - - - - - - - - -
---------GAGGTCTACAACCTCGTGTTCATG---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E K Q N I D T G M G L E R M A Q V L Q G V P N N
- K Q N I D T G M G L E R M A Q V - - - - - - -
---AAGCAGAATATCGATACGGGCATGGGGCTGGAGCGCATGGCTCAAGTC---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y E T D L I F P I I Q A V A A I A Q R D Y A S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S E S V K V S L K V I G D H L R A V T H L I A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G V T A S N L G R G Y V L R R L I R R V V R H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R L I G I D R P F T A E I A E T A I A L M A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y P N L R E R E A A I K A E L T R E E Q R F L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T L E R G E K L L A E L L A A A T D Q I R G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A F V L Y D T Y G F P L E L T Q E I A E E K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T V D L A G F E A A M A A Q R Q R S Q A A H E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I D L T V Q G S L D R L A E Q I H P T E F V G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G D A V A T A K V T A L L R E G Q S V E A A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G D R V Q I V L D H T P F Y A E S G G Q V G D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G V L T G E S L I V R I E D V Q K E S G F F V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y G Q I E R G L L Q V G D S V T A Q I D R A C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R R A Q A N H T A T H L L Q A A L K L I V D E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I S Q A G S L V A F D R L R F D F N C P R A V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
P E E L R Q I E D Q I N Q W I A E A H G T V V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V M P I A T A K A K G A V A M F G E K Y G A E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R V I D V P G V S M E L C G G T H V A N T A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G L F K I I S E A G V A S G V R R I E A V A G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A V L E Y L N V R D A V V R D L S D R F K A K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E E L S D R V T A L Q E E L K A N Q K Q L T A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K A E L A I A K S D A L V S Q A I P V G D A Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L V E T L T G V D A A A L Q T A A E R L Q Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G D A G A V V L G S S P E E G K V T L V A A F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
P A I I A K G L K A G Q F I G G I A K I C G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G G G R P N L A Q A G G R D A S K L P E A I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899
A L D Q L K T A I A S
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_ala_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L T A K E T R D S F K N F F E S K G H Q I V P
- - T A K E T R D S F K N F F E S K G H Q I V P
------TCCTGCCAGTTCCAGTACCTTCTCAACAGCAGCGTTCAGTCCGTCCGGATTCTTGCCACCGGCTGT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S A P M V I K D D P T L M F T N A G M N Q F K D
. A P M V I - - - - - - M F T N A G M N Q F K -
---GAAGTGAGGTTGACC------------------CAGTTTGGCAGCTTCTTTCACCAGATTACCTGC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I I L G N H P A K Y H R V A D S Q K C L R V S G
- - - - - - - - - - H R V A D S Q K C L R V - -
------------------------------CATAACAGTCAGCATTGGTTTATTGGCATCTACTGT------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K H N D L E E V G H D T Y H H T M F E M L G N W
- - - - - - - - - - - - - - - T M F E M L G N W
---------------------------------------------GATGTTCTTCACTACTTCGGCGGGCAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S F G D Y F K K E A I S W A W E Y L V D V L K L
S F - - - - K K E A I S W A W E Y L V - - - - -
CGGCAA------------GACTTTAATGCCGTTAATCTCTTGTACATTTTTCAGCAG---------------
121122123124125126127128129130131132133134135136137138139140141142143144
N P E H L Y A T V F E G S P E E G L E R D N E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A S Y W E Q Y L P K D H I I N G N K H D N F W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
M G D T G P C G P C S E I H I D L R P A E E R A
- - - - - - - - - C S E I H I - - - - - - - - -
---------------------------TGCTTCGATACGGCGTAC---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K I S G R D L V N H D H P Q V I E I W N L V F M
- - - - - - - - - - - - - - - - E I W N L V F M
------------------------------------------------ACAGAATTCAATGGATGAGCCAAA
217218219220221222223224225226227228229230231232233234235236237238239240
Q Y N R K A D S T L E P L P A K V I D T G M G F
- - - - - - - - - - - - - - A K V I D T G M G F
------------------------------------------GGCGATTGCGCCCAGTTCTTTCGCTTCTTC
241242243244245246247248249250251252253254255256257258259260261262263264
E R L C M A L Q G K T S N Y D T D V F Q P L I K
E R L C M A - - - - - - - - - - - - - - - - - -
GATAGGGATGTTGCGGTG------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A I A Q M A G T E Y G K N E Q N D I A M R V I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D H I R T I A F S I T D G Q L P S N A K A G Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I R R I L R R A V R Y G Y T F L G Q K Q A F M Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K L L P V L I D S M G D A Y P E L I A Q K E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E K V I K E E E E S F L R T L E T G I R L L D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T M A D T K A N G K T E I S G K D A F T L Y D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F G F P L D L T E L I L R E N G M T V N V E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D A E M Q Q Q K Q R A R N A A A I E T G D W I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L K E G T T E F V G Y D Y T E Y E T S I L R Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q V K Q K N Q T L Y Q I V L D Y T P F Y A E S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G Q V G D T G V L V N E F E T I E V I D T K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N N L P I H I T K K L P E H P E A P M M A C V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T D K R A A C A A N H S A T H L L D E A L R E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L G E H V E Q K G S L V T P D S L R F D F S H F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q K V T D E E L R K V E H L V N A K I R A N V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L Q E H R N I P I E E A K E L G A I A L F G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y G D H V R V I Q F G S S I E F C G G T H V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T G N I G M V K I I S E S S V A A G V R R I E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
Y T G A R V E E M L D T I Q D T L S D L K A L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
N N T P D L G V A I R K Y I D E N A G L K K Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E D F M K E K E A A V K E R L L K N V Q E I N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I K V I K F C L P M P A E V V K N I A F Q L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
E I T E N L F F V A G T V D A N K P M L T V M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S D N L V A G G L K A G N L V K E A A K L I Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G G G G Q P H F A T A G G K N P D G L N A A V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872
K V L E L A G I
- - - - - - - -
------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_ala_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K L T S A E V R R M F L E F F Q E K G H T V
- - - - T S A E V R R M F L E F F Q E K G H T V
------------ACATCTGCCGAAGTGCGGCGCATGTTTTTAGAGTTTTTCCAGGAAAAAGGCCATACGGTG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P S A S L I P V D D P S L L W I N S G V A T L
E P . A S L I P - - - - - - L W I N S G V A T L
GAGCCG---GCATCGCTCATTCCG------------------CTGTGGATCAACAGCGGCGTCGCGACGTTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K Y F D G R I I P E N P R I C N A Q K S I R T
K - - - - - - - - - - - P R I C N A Q K S I R T
AAA---------------------------------CCGCGCATTTGCAATGCGCAAAAATCGATTCGCACG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N D I E N V G K T A R H H T F F E M L G N F S I
- - - - - - - - - - - - - T F F E M L G N F S I
---------------------------------------ACGTTTTTTGAAATGCTCGGCAACTTTTCGATC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G D Y F K R E A I H W A W E F L T S D K W I G F
- - - - K R E A I H W A W E F L T - - - - - - -
------------AAGCGTGAAGCGATCCATTGGGCATGGGAGTTTTTAACG---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D P E R L S V T V H P E D E E A Y N I W C N E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G L P E E R I I R L E G N F W D I G E G P S G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N T E I F Y D R G E A F G N D P N D P E L Y P G
N T E I F Y - - - - - - - - - - - - - - - - - -
AATACGGAAATTTTTTAT------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G E N E R Y L E V W N L V F S Q F N H N P D G T
- - - - - - - E V W N L V F S - - - - - - - - -
---------------------GAAGTATGGAACCTTGTCTTTTCG---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y T P L P K K N I D T G M G L E R M C S I L Q D
- - - - - K K N I D T G M G L E R M C S I - - -
---------------AAGAAAAACATCGACACCGGCATGGGCTTGGAGCGGATGTGCTCGATT---------
241242243244245246247248249250251252253254255256257258259260261262263264
V P T N F E T D L F M P I I R A T E Q I S G E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y G E D R E K D V A F K V I A D H I R A V T F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I G D G A L P S N E G R G Y V L R R L L R R A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R Y A K H I G I E R P F M Y E L V P V V G E I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H D Y Y P E V K E K A D F I A R V I R S E E E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F H E T L H E G L A I L S N V I E K A K S E G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D V I P G E D V F R L Y D T Y G F P I E L T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y A A E A G M K V D H D G F E R E M E R Q R E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R A A R Q D V D S M Q V Q G G V L G D I K D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S R F V G Y D E L V A S S T V L A I V K D G Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V E E V R A G E E A Q I I V D V T P F Y A E S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G Q I A D Q G T F A G E T G T A V V K D V Q K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P N G Q H L H S I V V E S G T V K K G A V Y T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R V D E A K R A R I I K N H T A T H L L H Q A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K D V L G R H V N Q A G S L V A P D R L R F D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T H F G Q V K P E E L E R I E A I V N E Q I W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S L P V D I F Y K P L E E A K A M G A M A L F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E K Y G D I V R V V K V G D Y S L E L C G G C H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
V P N T S A I G L F K I V S E S G I G A G T R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I E A V T G E A A Y R F M S E Q L A I L Q E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q K L K T S P K E L N A R L D G L F A E L K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E R E N E S L S A R L A H M E A E H L T R Q V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
D V N G V P V L A A K V Q A N D M N Q L R A M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D D L K Q K L G T A V I V L A A V Q G G K V Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I A A V T D D L V K Q G F H A G K L V K E V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
R C G G G G G G R P D L A Q A G G K D A Q K V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
E A L N Y V E T W V K S I S
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_ala_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R T A E I R E K F L S F F E G K G H L R L P S
- R T A E I R E K F L S F F E G K G H L R L P .
---GGGGAGGAGGCCGGGGAGGGCCTCCCGGGCCTTCCTGGGGTCCAGGCCGCCCCCCTGGGCCAGGGC---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F S L I P E D D P S L L F T S A G M A P L K P Y
F S L I P - - - - - - L F T S A G M A P L K - -
CTTGCCCCCGCCCCG------------------GAGGGCCCGGAAGAGGGCCCCCGCCTCGAGGCC------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F L G A K P I F G G R E W R R V T T C Q E C L R
- - - - - - - - - - - - - R R V T T C Q E C L R
---------------------------------------CGAAAGCACCAGGGCCACGTCCGCCCCCCGGGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V G D I E N V G R T S R H N T Y F E M L G N F S
V - - - - - - - - - - - - - T Y F E M L G N F S
CAC---------------------------------------GCCGGGAAGCTCCGCCACCGTCCACCTGAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F G D Y F K K E A I L W A W E F L T E H L K L D
F - - - - K K E A I L W A W E F L T - - - - - -
CCC------------CAGGGAAGCCCCCCCGCCGCCCCCCAAGGCCGCCTGGAC------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P G R L W V T V F E D D D E A Y E I W R D L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V P E E R I G R F G E D E N Y W P G G A I T H G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P N G P S G P C S E I F Y D R G P A Y G T P D E
- - - - - - - C S E I F Y - - - - - - - - - - -
---------------------CACCCCGGCGGAGACCGC---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T G P N T G S G D R F V E I W N L V F T Q Y D R
- - - - - - - - - - - - E I W N L V F T - - - -
------------------------------------CTTGGACTCAAGGCCCTCTAGGGG------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q G P I P G P G I L K P L P Q K N I D T G M G L
- - - - - - - - - - - - - - Q K N I D T G M G L
------------------------------------------GGCCATGGCCCCCTCCTTCCTCGCCTCCTC
241242243244245246247248249250251252253254255256257258259260261262263264
Y R V A A I L Q D V E D F Y R T D T F F P I I Q
Y R V A A I - - - - - - - - - - - - - - - - - -
CAGGGGCATGTAGCGCCA------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V A R M S G R P Y E G K T S V S H R V I A D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V R A V V A A L S D G A T F S N T G R G Y V I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R L L R R A L R H G Y L L G L S D P F L H R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P L V A E L L G D F Y P E M R E N L P A V E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I R L E E E R F L E T L E G G L K R L D A L L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G L K P G E V L P G K E A F R L Y D T Y G F P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D L T V E I A A E R G Y G V D T E G F Q K A M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E Q Q S R S R A A M A F E R E I F K K G A Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E E L Y A E R G A T E F L G Y N A L E A E A E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L A L L A G D Q S L L E A G P G T E V Q V V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K T P F Y A E G G G Q I G D F G L L E W P G G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A R V E T T R K T E R G I F L H K A R V E E G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L R V G E R V R A V V D P R R R D T E R N H T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T H L L H A A L R A V L G P H V R Q A G S L V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
P D R L R F D F T H P E P L K P E E L E R V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L V N R W I M A D F P V T W R Y M P L E E A R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E G A M A L F G E K Y G E V V R V V R V E G S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L E G L E S K E L C G G C H V R R T G E I G A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
L I R S E E A V S A G V R R I E A V T G E E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R F A R G S L N R L K A L A E R L E V G E A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E E R L E K L L A E L K E K E R E V E S L K A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L V Q A A L G G G G G A S L E E K G G L R W T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A E L P G L D A K A L R Q A A D D L V A R G A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V A L V L S G G Q A V L K L S P K A Q G M G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A G A L F R A L A E K A G G R G G G K G A L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882
G G G L D P R K A R E A L P G L L P
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_ala_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K G S E L R Q R F L D Y F A R Q G H A V V P S
- K G S E L R Q R F L D Y F A R Q G H A V V P S
---CAGCAAACCGTTGGCTTCGGCTAAGGCTTGATCAAGCGCAGCCGCATCGCGACCGCCAGCTTGGGCAAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S L I P A D N P T L L F T V A G M V Q F N D V
S . L I P - - - - - - L F T V A G M V Q F N - -
ATC---GCGACCGCC------------------GGCAGCCAAGGCTTTGACTAAATTGCCAGCATG------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F L G R E S R P Y S R A V S S Q K C L R I S G K
- - - - - - - - - S R A V S S Q K C L R I - - -
---------------------------GGCGAGCAGCAAAGGCTTGCCATCGATTACCGTGCC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q N D L E N V G P S P R H H T F F E M L G N F S
- - - - - - - - - - - - - - T F F E M L G N F S
------------------------------------------GCGGAAGCTATCAGCATCGCTGGCTTCAAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F G D Y F K K D A I R F A W E F L T Q E I G L D
F - - - - K K D A I R F A W E F L T - - - - - -
GCG------------TGGCGTGCCAGCTTGCTCAATTTTTTGGGCGAGCAAGCT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P K R M W V S I Y E G D E Q I P A D E E A H D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W L A Y M P A E R I L R F D A K D N L W S A G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V G P R G P C S E I H Y Y I G D D P D N Q V P E
- - - - - - C S E I H Y - - - - - - - - - - - -
------------------AGTTACTGCCTCGATCCG------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G V N S E D D T Y M E I W N L V F M Q Y N R D E
- - - - - - - - - - E I W N L V F M - - - - - -
------------------------------AACGTGAACACCACCGCAAAGCTC------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N G V L T L L P K P S I D T G M S L E R L A I V
- - - - - - - - K P S I D T G M S L E R L A I V
------------------------ACTTGCATTGCCACAACCAACGGTGACCACCCGCACCACATCGCCATA
241242243244245246247248249250251252253254255256257258259260261262263264
K Q G V F R S Y E T D L F T P I I H T V M E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G T G S D H Y Q A N S S A Y H V V A D H S R S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A F M I A D G L R P G N E G R S Y V L R R L V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R A A Y F G Q T I G F K A P F L A E T I A T V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D M M G A A Y P E L R S K Q A Y I A E V V T G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E E R F N K T L A G G L R Q L E A M L P N Q A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K A V F S G A D A F K L Y D T Y G F P L D L T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R I V A E R G L T V D L A G Y E A E L E A Q R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R G R G A A Q F K K G A V T E R W A E R N L A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T S F T G Y N E L E S W G H V L A L E F D G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L G T V Q R G Q E V A F V L D R T P C Y A E S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G Q M G D S G V L V G P H G T I V I D D V Q K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V P G V F V H R G K V S K G S V S L G E Q V T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T V D A A R R R D I V R N H T A T H L L H R A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R D T L G D H A E Q K G S L V A P E R L R F D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N N Q K G L S S E Q L Q Q I E D Q V N A W I R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
D S K V E A A E M A L P Q A R E L G A M A L F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E K Y G D V V R V V T V G C G N A S D H I H T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S E A P V C S R E L C G G V H V A R T G E I G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
F K I V S E G S V A S G V R R I E A V T G R A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A E W V S Q Q A Q L I R T L G D K L G A Q P G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V E E K L D A L L L D Q K A R R D E I E R L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E I A A G Q V D S L L A Q K I E Q A G T P L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A R V E A S D A D S F R R L G E Q L R D K I G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G V V I L G T V I D G K P L L L A A A T A D Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K A G R H A G N L V K A L A A K V G G G G G G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
A D F A Q A G G R D A A A L D Q A L A E A N G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889
L
-
---
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_ala_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Y M T S E E I R E A F L K F F E K K G H K I
- - - - T S E E I R E A F L K F F E K K G H K I
------------CTCTTCGAGACGTTCCAGAACGTCTTTTATCCTCTCCGGATGTCTTCCACCCGCTTGGGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L P S A S L I P D D P Q L L F T V A G M V P F K
L P . A S L I P - - - - - L F T V A G M V P F K
AAAATT---TCGGCCTCCTCCGTT---------------CGCTATGTTTCGTGCTATAGAGGAGGCATCGTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P I F W G K V E P V Y T R V A T C Q K C L R T V
- - - - - - - - - - - T R V A T C Q K C L R T -
---------------------------------GAGGGAAACCTTGTTTTCGAACTTACTGAAGAGAAT---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D I E N V G K T P R H H T F F E M L G N F S F G
- - - - - - - - - - - - T F F E M L G N F S F -
------------------------------------TATTCCTCCGAGGTGTTTTGCCTCGACGCCTTC---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D Y F K E E A I E W A W E F L T Q V L G V P E E
- - - K E E A I E W A W E F L T - - - - - - - -
---------GAAGACCTTTACACCATCTTCCAGCTGTTTCATGGCTAT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K L W V S V Y E E D E E A F R I W N E K I G L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K R I L R M G K E D N F W G P A G P T G P C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P D T E I F Y D T G Y S K G C P E G E G C T P A
- D T E I F Y - - - - - - - - - - - - - - - - -
---GACCGCTTCGATTCTTCG---------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N S E G R F V E I W N L V F T E Y Y Q D E E G K
- - - - - - - E I W N L V F T - - - - - - - - -
---------------------TCCGCCACAGAGTTCTTTACTCAC---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L H P L P R K N I D T G A G L E R F C A M M Q G
- - - - - R K N I D T G A G L E R F C A M - - -
---------------CGTGAAAAGCGCAACAACTCCGGACTTTACCGCTTCTTCGTAGCTCGT---------
241242243244245246247248249250251252253254255256257258259260261262263264
V Y S N F D T D L F Q P I I K R I E E L T G V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y K T D E E K D V S I R V I A D H I R A I T F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I S E G V F P S N E G R G Y V L R R I I R R A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R H G I L L G M S E P F L Y R I V D A V V E K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G K V Y P E I V R G E G M V K E V L S A E E N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F L K T L E Q G M K V F D E I V E K K G K I D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E D A F R L Y D T Y G L P L E L T L E I A K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G V E V D V Q E F N K Y M E E Q Q R K S R A A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G D V E F A R R Y E Y L E K L P K D F R T E F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G Y E K L E D E G E V V L V A R D D E T V E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S E G T V E V V F S R T P F Y A E K G G Q V S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T G M V E W R D G K A L V E Y V F E A S E G V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V H R I K I L D G T L R R G Q K V I L R V D K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R R E A T M R N H T A T H L L H A A L K K V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D H V R Q A G S L V A P D R L R F D F T H F K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L S S A E I E Q V E D L V N E W I M E A I P V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
V R Y T S Y E E A V K S G V V A L F T E K Y G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V V R V V E V P G V S K E L C G G T H V K N T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
Q I G L F K I I S E E S V S S G V R R I E A V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G F S A L E L L R N Q K K L I D Q L K E I L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R E D E L T D R V L S L R E K V K E L E K K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
Q G R I S E E R I A M K Q L E D G V K V F H G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
F E G V E A K H L G G I A D N V L K K E G E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
V I L F S K F E N K V S L V V K V S E N L L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
Y D A S S I A R N I A K E L G G N G G G R K N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863
A Q A G G R H P E R I K D V L E R L E E F L R
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_ala_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S S S E I R Q Q F V D F F C K K H G H T N I
- - S S S E I R Q Q F V D F F C K K . G H T N I
------CCTCTTCAAGCCCGGCACATCGACCGTCAGGCCCTGCTCCTGGGCCAT---GAGCGTGATGTCGAT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A S S P V V P L N D P T L L F A N A G M N Q F K
A S . P V V P - - - - - - L F A N A G M N Q F K
GATGAC---GTAGGTGTCGTG------------------GCCGCTCACCTGCGTGCGCCCCTCGTCCTTCAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y F L G T E K P P V V R V A N T Q K C I R A G
- - - - - - - - - - - V R V A N T Q K C I R A -
---------------------------------GCGCCGCAGGGTGCGCAGGAACGCCGCCTCTTCGTC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G K H N D L D D V G R D T Y H H T F F E M L G N
- - - - - - - - - - - - - - - - T F F E M L G N
------------------------------------------------CGCGCCGAAGTGCTCCACCACCGT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W S F G D Y F K K D A I A W A W E L L T E V W K
W S F - - - - K K D A I A W A W E L L T - - - -
GTCAACGAG------------CGGCTCGTTCGTGCCGAGCACCTGGTACCCGTACCGCTC------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D P T R L H V T V F E G D P A N G I P R D D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A A G F W K A V G V P E E R I H L G N K K D N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
W E M G N T G P C G P C T E I H I D R T P D K S
- - - - - - - - - - - C T E I H I - - - - - - -
---------------------------------CGGGGTGAACACGTCCGT---------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G G P L V N G G T D K V I E I W N L V F I Q F N
- - - - - - - - - - - - - E I W N L V F I - - -
---------------------------------------GTCGACGTGCTGGGCGGGCAGCGG---------
217218219220221222223224225226227228229230231232233234235236237238239240
R N E D Q S L T P L P A Q H V D T G M G F E R I
- - - - - - - - - - - A Q H V D T G M G F E R I
---------------------------------CAGGTTCCAGATCTCGATGACCTTGTCCGTGCCGCCGTT
241242243244245246247248249250251252253254255256257258259260261262263264
C S V V Q G K S S N Y D T D V F T P L F E A I Q
C S V - - - - - - - - - - - - - - - - - - - - -
CACCAGCGG---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K V T L C D R P Y G G D L N D L K D T A Y R V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A D H I R T L T F A L T D G A T I G N V G R D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L K R I L R R A E R Y G Y Q V L G T N E P F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y R L V D T V V E H F G A A F P E L K K N P H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V K D Q I R D E E A A F L R T L R R G I T L F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I A A Q M K D E G R T Q V S G K E A F K L H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T Y G V I I D I T L Q M A Q E Q G L T V D V P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436
L K R R
- - - -
------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_ala_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q Y L S G N E I R Q K F L E F Y S Q R G H Q I
- - - - S G N E I R Q K F L E F Y S Q R G H Q I
------------AGTGGTAACGAAATTCGGCAAAAGTTTTTAGAATTCTATTCCCAGCGAGGACATCAGATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A S A S L V P E D P T V L L T I A G M L P F K
L A . A S L V P - - - - - L L T I A G M L P F K
CTCGCT---GCATCCCTCGTGCCA---------------TTACTGACGATCGCGGGGATGTTACCATTTAAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P I F L G Q R S P E F K R A T S S Q K C I R T N
- - - - - - - - P . . . R A T S S Q K C I R T -
------------------------CCT---------CGCGCTACGTCATCTCAAAAGTGTATCCGCACC---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D I E N V G R T A R H H T F F E M L G N F S F G
- - - - - - - - - - - - T F F E M L G N F S F -
------------------------------------ACTTTTTTTGAGATGCTAGGAAATTTCAGCTTT---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D Y F K E Q A I A W G W E I S T T V F G L P P E
- - - K E Q A I A W G W E I S T - - - - - - - -
---------AAAGAACAAGCGATCGCTTGGGGATGGGAAATATCGACA------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R L V A S V F E S D D E A Y A I W R D K I G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E A R I K R M G E D D N F W Y S G P T G P C G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
C S E I Y Y D F H P E R G D A N I D L E D D T R
C S E I Y Y - - - - - - - - - - - - - - - - - -
TGCTCGGAAATATACTAC------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F I E F Y N L V F M Q Y N R D A E G N L T P L A
- - E F Y N L V F M - - - - - - - - - - - - - -
------GAGTTTTACAACTTGGTATTCATG------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K K N I D T G M G L E R M A Q I L Q K V P N N Y
K K N I D T G M G L E R M A Q I - - - - - - - -
AAGAAAAATATCGATACGGGAATGGGACTGGAACGGATGGCGCAGATC------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E T D L I F P I I K T A A E I A G I D Y N N C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E K T K V S L K V I G D H I R A V M H M I A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R A S N T G R G Y V L R R L I R R V V R H G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L I G V Y R R D V T C N V F T P E V V E T A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L S E S A Y P N V R V R E A Q I K A E L Q R E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S Q F L K T L E R G E K L L D E I I E I A K Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Q T Q I S G E S A F T L Y D T Y G F P L E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q E V A E E Y N L T V D V D S F E V E M E K Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E R A K E A H E T I D L T V Q G S L D K L A E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I H A T E F V G Y T Q P V A T A E I K V L L M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G Q C V E E A E A G Q D V Q I V L D K T P F Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E S G G Q I G D R G Y L S G D A I L V R I E D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K K E S D F F V H F G R I E R G T L R V G D K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T A Q I D R A C R R R A Q A N H S A T H L L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A L K K I V D D S I S Q A G S L V D F T K L R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D F N C P R P V T P D E L Q Q I E E T I N T W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
A E A H T A E I S I L P L A E A K A R G A V A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
F G E K Y G E E V R V L D F P G V S M E L C G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
T H V S N T A E I G V F K I I S E A G V A S G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
R R I E A V A G S A V L D Y L N V R D K V V K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L S D R F K V K P E E L P D R I T T L Q T E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N T Q K Q L D T L K A Q L A L A K S E S L L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
A E S V G E F K Y V V A Q M E A V D P E S L K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A A E R L L Q K L G N G A V V L G S V P E E G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V S L V A A F S P E V N K K G L Q A G K F I G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I A K I C G G G G G G R P N L A Q A G G R D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882
K L P E A L E T A L S E L R S A L S
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_ala_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K S K E I R N K W L N F F E S K G H L I I P S
- K S K E I R N K W L N F F E S K G H L I I P .
---AATGATTCCTTTTTCTTTTAAAAGTTCAAATAAATCTTCTGCTTTTTCAATTTTCTTATCGATACT---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K S L I P I K D D S L L W I N S G V A T L K D F
K S L I P - - - - - - L W I N S G V A T L K - -
TTGCGAAAGAATATT------------------TTTATATTTTTCAAAAATTATATTAGAGATGTC------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F S G K K I P P S K R L T N S Q K S I R T N D I
- - - - - - - - - K R L T N S Q K S I R T - - -
---------------------------GAAAAATTTACCCTTACTAATTTCAGAACCTAAAAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E N V G K T A R H H T F F E M L G N F S I G D Y
- - - - - - - - - - T F F E M L G N F S I - - -
------------------------------TAAAGATTGTAAAGAAGCCATTTTTAAATTCAT---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F K K E A I N F G F E F I F D V L K F D R E K I
- K K E A I N F G F E F I F - - - - - - - - - -
---TTCAGTGTTTTTAAATTTCATAATGCTAAAATCAGACTC------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F F T Y F S E D L E T L E I L K S L N V P D S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I I K G S R K T N F W D M G N G P C G P N L E I
- - - - - - - - - - - - - - - - - - - - N L E I
------------------------------------------------------------ATTTTCTAAAAC
169170171172173174175176177178179180181182183184185186187188189190191192
F Y D R G P K Y S N R G I E L L K N D I E N D R
F Y - - - - - - - - - - - - - - - - - - - - - -
TAATTT------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y I E I W N I V F S Q F N N D G N G N Y E L L K
- - E I W N I V F S - - - - - - - - - - - - - -
------ATTTTTTCCTTTTGAATCTAAAGA------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q K N I D T G A G L E R L A C I L Q D T P T N F
Q K N I D T G A G L E R L A C I - - - - - - - -
TGTACCACCACATAAATCAGCTGTTATTTTTGGGAAATTAACAATTCT------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E T D L F L P I I K E I E K L S I Y K Y K I D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y F L K D K I Q E K I N L N F K I I S D H L R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V N A I N D G A K P S N N G R G Y I I R R L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R A Y R S G I F L G I K G K S F L H K M T Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V R D S L I Y D I D V E K V S K I I K K E E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F S K T I S E G I N L L K E K I K S K F P K D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S I D I E N K S Q V A K Y F K E N N L T F D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I A F E L F S T F G F P V E I I K E I L E D E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E I E L D I S N L P K Y L E E H A N K S R S E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S S A M Q K V I N S L E L V K E K V S E F V G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S T L K T K S K I L Y L L N E T E E I H F T N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E N E I S Y L I L D K T P F Y A T A G G Q R H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K G L L I Q D K N R I E V L E V F K D K H L N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V H K V K G K I L K S E L I N A E V D S N I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G L E R N H S G T H L V F N A L S R E F G K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E Q L G S D N N E E R L T F D F P L S K K P S W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E E I K N V E K R V N E Y I N M S V D R E Y I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
T T L E G A K K L N A V M T L E E Q E Y M D P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E V R I V N F P K I T A D L C G G T H I E N T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K I E T F K I I S L D S K G K N K F R I K A I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S K K I V E E Y L K D E I S K N K L V L E N L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
E K N K S L F Q G Y K M N F S W S K N L D E Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E Q I T K H I D Q A R S D Y K K L L K N S E N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L E K L E S D F S I M K F K N T E I I F D M N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K M A S L Q S L V A T L R E K N P K A I V I L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
S E I S K G K F F I C V G S K E F S A K D I S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
I I F E K Y K G K G G G N N I L S Q G S I D K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905
I E K A E D L F E L L K E K G I I
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_ala_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T L N K L R K K Y I D F F K S K K H F E I M G
- T L N K L R K K Y I D F F K S K K H F E I M .
---CTCATCAATCAAAATAGCTTTTATTCTTCTTATACCTGAAGATGAGGATTGTTCTTTTTGTATTTT---
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K S L V P E N D P T V L F N T A G M Q P L I P Y
K S L V P - - - - - - L F N T A G M Q P L I - -
AGTACCAAGTTCATT------------------GCCTCCACAAACTTCAAGCGAAAATCCATCTAT------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L G E V H P S G D M L V N V Q K C L R T G D I
- - - - - - - - - D M L V N V Q K C L R T - - -
---------------------------TCCAAAAAGAGCCATAGCACCTTTTTCTCGAGCTTC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D E V G D L S H L T F F E M L G N W S L G A Y F
- - - - - - - - - T F F E M L G N W S L - - - -
---------------------------ATTTTTTATCTGTAAATTAACAATCTCTTCAAC------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K E Y S V K C S F E F L T S S D Y L N I P K D S
K E Y S V K C S F E F L T - - - - - - - - - - -
ATCATCCGTCATCTTTTCAGAATGAACAAAATCAAACCT---------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L Y V S V F E G D Q E I P R D T E T A K V W E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L G I S K D R I H Y L S K D H N F W G P V G S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G P C G P D T E I Y V D T G K S K C S L D C N I
- - - - - D T E I Y V - - - - - - - - - - - - -
---------------AAAACCCAACTTATCAAC---------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T C S C G K Y F E I W N N V F M Q Y N K D E N G
- - - - - - - - E I W N N V F M - - - - - - - -
------------------------TAGTTTAAAAGCAATATCACCAGG------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N Y I E L G R K C V D T G M G L E R T I A F L Q
- - - - - - R K C V D T G M G L E R T I A F - -
------------------TTGCTCTCCTTGAGATAAAGTTTTAAAAAACTTTTCTTCTTCTTTGCT------
241242243244245246247248249250251252253254255256257258259260261262263264
G K S S V Y D T D A F M P I I K R I E Y I S G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I Y G Q K E D D D R C I R I I S D H V K A A C F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I L A D S S V V F P S N L G Q G Y V L R R L I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R S I R Y A K K L G I K S H F L A D L V D S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A I Y R S F Y N E L T E K K D F I K K E L S K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E E K F F K T L S Q G E Q E F I K I T R N L P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K T I P G D I A F K L Y D T Y G F P Y E V T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A I E Y G F N V D K L G F N E H F K K H Q K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S K K G G D K V F K G G L A D Y T Y E T T K L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T A T H L L H K A L Q L V L G D H V R Q K G S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I T A E R L R F D F V H S E K M T D D E I K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E E I V N L Q I K N S L S V K K I I M E L S E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R E K G A M A L F G E K Y D D L V S V Y E I D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F S L E V C G G P H V E N T N E L G T F K I Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594
E Q S S S S G I R R I K A I L I D E
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_ala_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M C S S N I R Q K F V D F F K Q K D H H H V K A
- C S S N I R Q K F V D F F K Q K D H H H V K A
---TAATATATATTTCTCTAATATGTGGCGAGCTGTAACTAGTACTTGGTTTATTCCGCTGGCATCATTTCC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A P I V N K E D P T L L F T N A G M N Q F K D F
. P I V N - - - - - - L F T N A G M N Q F K - -
---TGCTGTAGCAAA------------------GCCTCCTTGAATAAGAGTTGCTAACTCTTTAAT------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F L N Q Q E A P Y Q R A I S T Q P C L R V S G K
- - - - - - - - - Q R A I S T Q P C L R V - - -
---------------------------TAACTCTTCAGAAATAAATAATGCGATATGTGGCTG---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H N D L E E V G V D T Y H H T M F E M L G N W S
- - - - - - - - - - - - - - T M F E M L G N W S
------------------------------------------AAAGCTAAGAGCTACTTGTTTAAGTGCTTC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F G E Y F K E E A I A C A W E L L T E V Y K L P
F - - - - K E E A I A C A W E L L T - - - - - -
TAC------------TACTTCTTCAATAAGTACTTGAATTTCTTGAACTTGCTT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q E R L Y V T V F Q G D E E E S L E L D Q E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N T W E K Y I S R D R I L Y G N K K D N F W E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G D T G P C G P C S E I H V D I R T E E E I Q Q
- - - - - - - - C S E I H V - - - - - - - - - -
------------------------TGCATCGGCAGTAATGGC------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q A G K E L V N T G H P Q V I E I W N L V F I Q
- - - - - - - - - - - - - - - E I W N L V F I -
---------------------------------------------TGCATGCGTACCTCCACAAAGTTC---
217218219220221222223224225226227228229230231232233234235236237238239240
Y N R L A S G Q L M E L P A K H V D T G M G F E
- - - - - - - - - - - - - A K H V D T G M G F E
---------------------------------------TCCATATTTCTCTCCAAACAACGCTGTGACACC
241242243244245246247248249250251252253254255256257258259260261262263264
R L T M V L Q G K S S T Y D T D I F V P L I H N
R L T M V - - - - - - - - - - - - - - - - - - -
CATTGACTTAGCATC---------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I M R L S H K T Y G K D N K V D I A M R V V A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H I R A I T F A I A D G Q L P S N T Q A G Y V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R I L R R A V R Y G Y T N L G F E T P F M Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L V S I L A Q Q F K N V Y P Q I K Q Q Q S Y I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q V I K S E E E S F F K T L A V G L H R L E H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S E T L N I N G Q Q V I D G P T A F E L Y D T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G F P P D L T R L I A Q E K G L E V D E E G F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K A L Q N Q R I R S Q Q A A V L E Q G D W H I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V K D V D S V F I G Y D Q L E L I A K V I Q Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S I Y Q K G E E I Y Q I V L D Q T P F Y P E G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G Q V G D T G T L I V G E Q I I A V F D T K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y E R I I H Y T H E L P H D L H A T V Q A V V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V K K R N L I A S N H S A T H L L H A A L R Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L G S H I E Q K G S L V N E K L L R F D F P H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
T K V S P E Q I R E I E H I V N Q K I R A N I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L H E V R S M L L E D A K S M G V T A L F G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y G E Y V R V I T F D P Y F S K E L C G G T H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S A T G K L G F F K I T A E T G I A A G T R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E A I T A D A A E N F I I E Q L S I L N Q A T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A L K K P N D L V K S I Y H L L E E K A N L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K I L S Y Q A Q E V R S V I D N L Y Q H I K Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
Q E I Q V L I E E V K V P N V E A L K Q V A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
F R T N K G P F F L T L T S I I D Q Q P H I A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
F I S E E L I H K T Q M N A N I I I K E L A T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
I Q G G G G G Q P F F A T A K G N D A S G I N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878
V L V T A R H I L E K Y I L
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_ala_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K L K A S E I R Q K Y L D F F V E K G H M V
- - - - K A S E I R Q K Y L D F F V E K G H M V
------------AATGTAATCTTTAATAAAGCTTAATGATTTTGAGATATTTTCAGGTTGTGTACCGCCACC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P S A P L V P I D D D T L L W I N S G V A T L
E P . A P L V P - - - - - - L W I N S G V A T L
TTGAGC---ATCTGGACGACCGCC------------------TGGTGCCATTTGTTTGATAAGATCACCGGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K Y F D G R E T P K K P R I V N S Q K A I R T
K - - - - - - - - - - - P R I V N S Q K A I R T
TTT---------------------------------AACCATCGATACTTTATCATCAACATTACTTGCAAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N D I E N V G F T A R H H T F F E M L G N F S I
- - - - - - - - - - - - - T F F E M L G N F S I
---------------------------------------CATTGTCGAGCGAATTGCTTTCGCATTTGGTAC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G D Y F K Q E A I E F A W E F L T S D K W M G M
- - - - K Q E A I E F A W E F L T - - - - - - -
------------AACCAATACTTTATAGCCATTGATTTCTTCAACTTGATC---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E P D K L Y V T I H P E D M E A Y N I W H K D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G L E E S R I I R I E G N F W D I G E G P S G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N T E I F Y D R G E A Y G Q D D P A E E M Y P G
N T E I F Y - - - - - - - - - - - - - - - - - -
TTCTAAATATAAGAAAGC------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G E N E R Y L E V W N L V F S E F N H N K D H S
- - - - - - - E V W N L V F S - - - - - - - - -
---------------------AATTTCAGAAGTATTGCGGACATG---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y T P L P N K N I D T G M G L E R M A S V S Q N
- - - - - N K N I D T G M G L E R M A S V - - -
---------------TACACGCACAACATCACCATATTTTTCACCGAATAATGCCATTGCGCC---------
241242243244245246247248249250251252253254255256257258259260261262263264
V R T N Y E T D L F M P I M N E I E K V S G K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y L V N N E Q D V A F K V I A D H I R T I A F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I S D G A L P A N E G R G Y V L R R L L R R A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R F S Q T L G I N E P F M Y K L V D I V A D I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E P Y Y P N V K E K A D F I K R V I K S E E E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F H E T L E D G L A I L N E L I K K A K A T T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I N G K D A F K L Y D T Y G F P I E L T E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A V Q A G L K V D M T T F E S E M Q Q Q R D R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R Q A R Q N S Q S M Q V Q S E V L K N I T S A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T F V G Y D T A T A Q T T L T H L I Y N G E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S Q V E A G E T V Y F M L T E T P F Y A V S G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q V A D T G I V Y N D N F E I A V S E V T K A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N G Q N L H K G V V Q F G Q V N V G A T V S A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V N Q N D R R D I Q K N H S A T H L L H A A L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S V L G D H V N Q A G S L V E A D R L R F D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
H F G P M T N D E I D Q V E R L V N E E I W K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
I D V N I Q E M D I V S A K E M G A M A L F G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K Y G D V V R V V N M A P F S I E L C G G I H V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
R N T S E I G L F K I V S E S G T G A G V R R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
E A L T G K A A F L Y L E D I Q E K F N T M K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Q L K V K S D N Q V V D K L T Q L Q D E E K A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L K Q L E Q R D K E I T S L K M G N I E D Q V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E I N G Y K V L V T E V D V P N A K A I R S T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
D D F K S K L Q D T I I I L A S N V D D K V S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
V A T V P K S L T N N V K A G D L I K Q M A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
V G G K G G G R P D M A Q G G G T Q P E N I S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876
S L S F I K D Y I K N L
- - - - - - - - - - - -
------------------------------------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_ala_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F T E W P V S R V R Q E F V D Y F K K Q G H
- - - - - - P V S R V R Q E F V D Y F K K Q G H
------------------CCTGTGAGTAGGGTTCGCCAGGAGTTCGTCGACTACTTCAAGAAGCAGGGCCAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T F V P S S P V C P H D D P T L L F I N A G M N
T F V P S . P V C P - - - - - - L F I N A G M N
ACATTTGTGCCCAGC---CCTGTCTGCCCG------------------CTGTTCATCAATGCCGGCATGAAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q F K A L F L G T A D P N T D F G R L K R A A N
Q F K - - - - - - - - - - - - - - - - K R A A N
CAGTTCAAG------------------------------------------------AAGCGCGCTGCCAAC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S Q M C I R A G G K H N D L E D V G R D T Y H H
S Q M C I R A - - - - - - - - - - - - - - - - -
TCGCAGATGTGCATTCGCGCT---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T F F E M L G S W S F G D Y F K K E A I Q W A W
T F F E M L G S W S F - - - - K K E A I Q W A W
ACCTTTTTCGAGATGCTAGGATCATGGTCCTTT------------AAGAAAGAGGCCATCCAGTGGGCCTGG
121122123124125126127128129130131132133134135136137138139140141142143144
E L L T E V Y K L P K D Q L Y V T Y F E G D E N
E L L T - - - - - - - - - - - - - - - - - - - -
GAGCTCCTGACA------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N G L D P D L E A K E L W G Q F L P E S Q I V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G N A K D N F W E M G D T G P C G P C S E V H F
- - - - - - - - - - - - - - - - - - C S E V H F
------------------------------------------------------TGCTCGGAGGTTCACTTT
193194195196197198199200201202203204205206207208209210211212213214215216
D R I G G R N A A S L V N K D D P M V V E I W N
- - - - - - - - - - - - - - - - - - - - E I W N
------------------------------------------------------------GAGATCTGGAAT
217218219220221222223224225226227228229230231232233234235236237238239240
L V F M Q F E R R A G G S L T P L P Q K H I D T
L V F M - - - - - - - - - - - - - - Q K H I D T
CTGGTGTTTATG------------------------------------------CAGAAGCACATAGACACC
241242243244245246247248249250251252253254255256257258259260261262263264
G M G L E R L T S I L Q G V K S N Y D T D A W I
G M G L E R L T S I - - - - - - - - - - - - - -
GGCATGGGTCTGGAGCGCCTCACTTCTATT------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P L F E A I Q T A T G Y P K S Y A E I R N D P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D A L V A Y R V V A D H I R C L T S A V G D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V M P D S V G R G F V L R R I I R R A V R Y G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q F L G A K P G F F T Q L V D S V C T S L G P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F P H L K E P R N I Q R I K T V L A D E E Q S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A K T W E M G L K H F N H A V N E C R A N N S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V I S G S E A F V L H D R Y G F P V D L T C L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A E K D G M T V D L E G F N A E M K E S K V S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G R V A A T K T F I D A Y Q L E E L K T R G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q T D D A A K Y V W E D S T G D L L A I F D K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N S K F I S L L E P G N D L G A E G V G I I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T T N F Y A E S G G Q V Y D T G R L V A A S D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V F E V K K V Y N V A G Y V V H V G N L S K D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A S S I P S S A V V Q L Q V D Y E R R L P I A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N H T T T H Q L N W V L R R V L G E K P D N F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E V Q Q K G S L V T D E M L R F D F S Y N T K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
S N E D L V R V E R L L N E K I Q A G L P V Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E E V P L E A A S K I N G L R H M F G E K Y P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P V S V I S I G T P I N E M L A N P E K E E W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D Y A V E F C G G T H L K N L K E A E K A V I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S E E A L M K G V R R V V V A T K S E A D K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
K A G A V L K G Q Y D E L M K K E A T A T S V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A L S V L N K K V G D S C I P L V L K N E M R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
N I D A A I K R M N A T L K S Q A A E A R D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
A E A G K A L G A S Y D A A A A P F L V H Q M T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
E F G A E R E A L Q A F S D G F T S T V S G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
G V F L I G S D D E K A L A I V S M P A A F V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
R K M S A V A W A K S S I G K G G G K P N A A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
S G L P A K D V A A A A A K A M E E A E R M K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962
S L
- -
------
Class II
Eukaryotes/Dictyostelium discoideum/amino acid sequences/Ddiscoideum_ala_aa
Eukaryotes/Dictyostelium discoideum/nucleotide sequences/Ddiscoideum_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D V N Q I R K T F I D F F R E K C E H T F V P
- D V N Q I R K T F I D F F R E K . E H T F V P
---GTTTGCATTTGCAAATTCTCTTGAAACGAGAATAGCTTCATCGATTTT---TAATTTAGAACCAACACC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S A V I P H D D P T L L F A N A G M N Q F K P
S . A V I P - - - - - - L F A N A G M N Q F K -
TTG---AACATCAACTTT------------------TAAAACTTCGGTAACCTTTACAACCCAAGCATT---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I F L G Q V N P K S E Q A K L K R A V N S Q K C
- - - - - - - - - - - - - - L . R A V N S Q K C
------------------------------------------AAT---AGTAACTTTACCTTTTTCTTCATC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I R A G G K H N D L D D V G K D T Y H H T F F E
I R A - - - - - - - - - - - - - - - - - T F F E
TGGACTAAT---------------------------------------------------AGTGATTAAAGG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M L G N W S F G N Y F K K E A I T W A W E L L T
M L G N W S F - - - - K K E A I T W A W E L L T
AGTATTTGAATTGAAGTTTAC------------AACCTTTGGTTGAGATTTAGCCAATTCTTCAGAGGTTTT
121122123124125126127128129130131132133134135136137138139140141142143144
E V Y K L D K E R L Y V T Y F R G D P E K G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A D L E A K N L W L Q Y L P E E R V L P F G M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E N F W E M G D Q G P C G P C S E I H Y D K V E
- - - - - - - - - - - - - - C S E I H Y - - - -
------------------------------------------GAGGGCATTATTGAATCT------------
193194195196197198199200201202203204205206207208209210211212213214215216
G R D G A S F V N A D D P T L I E I W N L V F I
- - - - - - - - - - - - - - - - E I W N L V F I
------------------------------------------------GATACGACGTACACCAGCACCCAA
217218219220221222223224225226227228229230231232233234235236237238239240
Q Y N R E A D K S L R P L P Q K H V D T G M G L
- - - - - - - - - - - - - - Q K H V D T G M G L
------------------------------------------GTTTGACAAATGTGTACCACCACAAAATTC
241242243244245246247248249250251252253254255256257258259260261262263264
E R L T S I I Q K V P T N Y D T D V F M P I F A
E R L T S I - - - - - - - - - - - - - - - - - -
GATGGAATAGTTTGCCCA------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A I Q E V T G Y P E P Y G G K V G A E D T Q Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D M A Y R V I A D H I R T L T F S I A D G A A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S V D G R G Q V L R R I L R R A V R Y G K Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N A P A G F F S K L V D V V I A N F G E F F P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L R K K P E H I K M V L T R E E D M F N K T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K G I V E F E K M I K K S V N N T L S A E N A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F L S T C Y G F P I D L T T I M A E E K N Y K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D I K G Y E G L C E A Q S E I D R K R Q K E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V E L T L G A E A N A W L K N N D I K P T D D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F K Y K Q H E I Q S V I K A I W N G K E F V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A P K G T L I G V V L E N S N F Y A E Q G G Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y D I G Q L S F I D D Q K T A F D V K D C K V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G G Y V L H I G Y L S Y E C D S L K V G D R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L T V D Y T R R S P I M S N H T S T H M V N Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L K N I L G D G I D Q R G S F V D A Q R F R F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F S F G R A I T K D E L I K I D Q I V N D Q I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
K Q L D V H A K E V G L A S A K K I N G L R A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
F G E V Y P D P V R V V S V G V P V E Q L I E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
P T N P E W A N Y S I E F C G G T H L S N T K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
A E L F T I T S E E T L G A G V R R I V A V T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
S E A A S A I E L N K E L E V R F N N A L K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
G S E L A K E I V S L L D L L K V V T I S A S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R M N L V E T L K E V Q A L Q R K Q V K E Q E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
I L A Q Q A Q T Y L E K T S E E L A K S Q P K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
F V D L V N F N S N T P L I T E T I K K I Q T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
S P M T A I M L I S P D E E K G K V T C I G I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
P K D S E I S K T L T A N A W V V K V T E V L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G K G G G K V D V A Q G V G S K L D K I D E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946
L V S R E F A N A N
- - - - - - - - - -
------------------------------
Class II
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_ala_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A S E I R E K F L S F Y E S R G H T R M Q G A
M A S E I R E K F L S F Y E S R G H T R M Q . A
ATGGCGTCAGAGATTCGGGAGAAATTCCTAAGCTTCTATGAGAGCAGGGGGCACACGCGCATGCAG---GCA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S L I P A D P T V L L T I A G M L Q F K P V F L
S L I P - - - - - L L T I A G M L Q F K - - - -
TCCCTCATACCA---------------CTGCTTACCATCGCCGGCATGCTGCAATTCAAG------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G Q A P R S V P R A T T T Q K C V R V S D I E N
- - - - R . . . R A T T T Q K C V R V - - - - -
------------CGC---------AGAGCCACTACCACGCAGAAGTGCGTGCGGGTC---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I G V T A R H H T F F E M L G N F S F G D Y F K
- - - - - - - - T F F E M L G N F S F - - - - K
------------------------ACCTTCTTTGAGATGCTGGGCAACTTCAGCTTT------------AAG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E A I Q M A W E L S T K V L G I P A Q R I W V
A E A I Q M A W E L S T - - - - - - - - - - - -
GCGGAGGCCATCCAGATGGCGTGGGAGCTGTCGACC------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S V Y K D D E E A A A L W R D G V G F P A E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V R L G D E D N F W A S G P T G P C G P C S E L
- - - - - - - - - - - - - - - - - - - - C S E L
------------------------------------------------------------TGTTCAGAGCTG
169170171172173174175176177178179180181182183184185186187188189190191192
Y Y D F H P E R G T V G A S L E D D S R F I E F
Y Y - - - - - - - - - - - - - - - - - - - - E F
TACTAT------------------------------------------------------------GAGTTC
193194195196197198199200201202203204205206207208209210211212213214215216
Y N L V F M E S N R G P D G K L T P L A N K N I
Y N L V F M - - - - - - - - - - - - - - N K N I
TACAACCTCGTCTTCATG------------------------------------------AACAAGAACATT
217218219220221222223224225226227228229230231232233234235236237238239240
D T G M G L E R V A Q I L Q C V P N N Y E T D L
D T G M G L E R V A Q I - - - - - - - - - - - -
GACACTGGCATGGGGTTGGAGCGTGTTGCACAGATC------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I F P I V A A A G K L A G L D Y H S A S P G E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T A L K V M G D H A R A V V Y M V S D G V S P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N I G R G Y V L R R L I R R T I M K G R L L G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K E V M L P A L A E T V I G L S D G C D P A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q N S Q R I I A E L A R E E E K F A S T L E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G F P C P S Y A D F L C M S G S L D Q F L L W G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D G S T A T V S G A A A F E L Y D T Y G F P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I T Q E M A A E R D I Q V D A A G F E A E M A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q K S R S R E A V R S I D M T A G H A L G D L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Q Q L G R T S F I G Y E H G P L R V P G S V L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I L R G G S S V E S A S A G D E V E V I L D R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P F Y A E S G G Q V G D R G C L T G V A S S S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
N N G A A S S S G S G L E L R V R D T Q K A G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G A L V V H H G S I E R G D L H V G Q M V M A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V D T S S R Q G A R K H H T A T H L L Q S A L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q V L K E E G E I S Q Q G S M V T A D R L R F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
F N L H R G L K E A E V A R V E E L V N G W V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
E D T A L T T R E M P L A E A K A A G A V A M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
G E K Y N D A A V R V V E V P G A S M E L C G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
T H V E R T A Q I G A F K I V S E A G I A S G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
R R I E A V V G P A A V Q Y L N Q V D G I V R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
L A S Q L K I K S E E I P G R V A A L A E E A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S A Q K E V A K L R A E L A L A K S A A L A D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
A A T T A S G A R V V V S R L D G I D N K A L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E A A K G L Q E R L G D D S A V A L M G V S E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
G K V A I V V A L G G G A V K K G L K A G A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G N L A K L C G G G G G G R P N L A T A G G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907
P A G L P A A L E A A E T Q L M E Q L
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_ala_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I S S S V S N S N R P M T G A E I R E A F L D
- - - - - - - - - - - - - T G A E I R E A F L D
---------------------------------------TTTAGCAATCTTAAGAGCACTTTCAAAACTTTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F F A K R G H Q R M A S A L L I P D D S T V L L
F F A K R G H Q R M A . A L L I P - - - - - L L
TAAATTACGCCCACCAGCTTGTGCCAAATTCGC---TCCACCACCACCACC---------------AATGTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T I A G M L P F K P I F L G R E Q P P A L S A T
T I A G M L P F K - - - - - - - - - - - L S A T
ATTGACAACTTTTCCAGCATTTAATCC---------------------------------AAAACTAACTTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S S Q K C I R T N D I E N V G K T A R H H T F F
S S Q K C I R T - - - - - - - - - - - - - T F F
ACCCTCCTCCAATATACTGCCTAA---------------------------------------CTTTGCTGC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E M L G N F S F G N Y F K E Q A I I W A W E L S
E M L G N F S F - - - - K E Q A I I W A W E L S
TGTACTTAATAATGCAGCCTGTAC------------TGATACTAATATCTGAAAATCACCTACAAGTTCTAC
121122123124125126127128129130131132133134135136137138139140141142143144
T E V F G L D P A N L V V S I F Q E D N E A A L
T - - - - - - - - - - - - - - - - - - - - - - -
TTG---------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I W Q N L I G V N P K R I I R M G A K D N F W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S G P I G P C G P C S E I Y Y D F H P D L G H D
- - - - - - - - - C S E I Y Y - - - - - - - - -
---------------------------AAGATAGGGAAGGACAGC---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D I N L E D D S R F I E F Y N L V F M E S N C D
- - - - - - - - - - - E F Y N L V F M - - - - -
---------------------------------TTTGAACAAACCAATCTCTCCTGT---------------
217218219220221222223224225226227228229230231232233234235236237238239240
S Q G N L T P L E N K N I D T G M G L E R M A Q
- - - - - - - - - N K N I D T G M G L E R M A Q
---------------------------AGGGATATTCACAACTCGTACGTAAGCTCCATATTTTTCACCAAA
241242243244245246247248249250251252253254255256257258259260261262263264
I L Q K K S N N Y E T D L I F P L I K K A A S L
I - - - - - - - - - - - - - - - - - - - - - - -
CAT---------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A G I D Y S E V N E K G K I S L K V I G D H S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A I S Q L I C D G V S A S N L G R G Y I L R R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L R R V V R H G R L L G I N D H F L V A M G E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S I E L M S K A Y P Q L E E K R D I I L N E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q E E A R F L E T L E R G E K L L S D I L K S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N Q Q I S G E Q A F E L Y D T Y G F P L E L T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E I T Q E H G R T V D V A G F E V A M K A Q R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R A K E A I V T I D P T L R S T I E G I A E S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K P T L F F G Y E V L D R S C Q V V A L I V K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E L V Q E A S T G D V V K V I L D G T P F Y G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S G G Q V G D R G M L L G S E T E K T S L I V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I E N V S R N Q G L F I H S G R I K K G T L R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G D L V I A K V D T H L R R R A Q A H H T A T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L L Q S A L K Q L V D A S I S Q A G S L V D F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R L R F D F S Y P G A I S L E K L E K I E N L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N D W I N E I H R V E V T E M K L E Q A K V N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A I A M F G E K Y G A Y V R V V N I P N V S M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
L C G G T H V S N T G E I G L F K I I S E T G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
A S G I R R I E A I A G T A V L P Y L N D R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
L V K E L G D H F K A P P S E V M V R V I A L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
D E L K T T N K A L L T A R S E L I S A K S A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
L A S Q V E L V G D F Q I L V S S F T G V Q A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
L L S T A A K Q L Q E Q L G D N T A V L L G S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
L E E G K V S F V A A F G K D V V Q R G L N A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
K V V N H I A K L C G G G G G G R A N L A Q A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
G R N L K S F E S A L K I A K S E L V S L L I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891
S P L
- - -
---------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_ala_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E Y T V K K L K R A F F S Y F K S K G H E I
- - - - T V K K L K R A F F S Y F K S K G H E I
------------TAGCTTAACATTTTTGTCAGTTTTAAAACTAAACTGCAATATTCCATTTTTCATTAAAAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I K S S S V I P S N D P S L L F T N S G M V Q F
I K S S . V I P - - - - - - L F T N S G M V Q F
AAATCCATCTTT---TTTATCACG------------------TTGTTTTACGTATCCATGAACAAAATCTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K N I L M G Q E T N L K R A C S I Q R C I R A G
K - - - - - - - - - - K R A C S I Q R C I R A -
ACA------------------------------CTTAAACAATTTGATAAAATTGCCTATGTTTTTTAA---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G K H N D L D D V G K D T Y H H T F F E M M G N
- - - - - - - - - - - - - - - - T F F E M M G N
------------------------------------------------TTGCTCATATTTTACAGGTGTATC
97 98 99 100101102103104105106107108109110111112113114115116117118119120
W S F G D Y F K K E A I E Y A W D F L V N I L K
W S F - - - - K K E A I E Y A W D F L V - - - -
CCGTGTCAC------------TTTTAAATTCTTTAAATTTTTTGTAAAATTTTCTTTCTT------------
121122123124125126127128129130131132133134135136137138139140141142143144
L E Q D R L Y V T Y Y K D M D S E S Y N I W K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F L P S E R I I E A D K N D N F W E M G D T G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
C G P C T E I H Y D R I G G R D A S R L V N Q D
- - - C T E I H Y - - - - - - - - - - - - - - -
---------AATTACTCGCCTAACATT---------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D P D V I E I W N I V F I E Y N R T P T G L E P
- - - - - E I W N I V F I - - - - - - - - - - -
---------------GTGACATCCACCACAAAGCTCTCT---------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L E R K C I D T G I G F E R L L S I L N N V K S
- - R K C I D T G I G F E R L L S I - - - - - -
------AACAATCGATGGATATTCTTCATTTTTCATATAAATTAAATTTTCTTC------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N Y L T N C F I P I I K N I E N M T D K K Y E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K L T I E D T A F R A V S D H C R T I A V C L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D N V E F S N E G Q G Y V L R R I L R R A V R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A H D I L K M Q R G D I G N L V K E I L K E M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L E I L E N D D G E I D H N L Y D T K I K K G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L D V N R E E D K F L E T L Q K G L E R F K K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S M N S Q I I S S E E I F R L Y D T Y G F P T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L V Q M L A E E H N V K L D F S K F E E C K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R E L S K K I N N E I T E I I L S D V S V T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D Q F K Y T E N G I S G R L Q F F T L E K K I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K F N V I N D D I S S S L E S I C N I S E N N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K F F N L P P E N T R I G M V F D R T C F Y S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S G G Q I G D T G L I T F Y E D N V E V G R F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V D D C K K V N G Y V L H Y G K L Q G K V T L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A N L E Y D D R S D I E R N H T G T H L F N Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L R K E I N T M Q R G S L V A K N K F R F D F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G H K I D L Q K V E D N I N L C I Q Q N L P V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
I K F M P K E D L L K E E N L I Y M K N E E Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S I V R M I C I G K L E N P E I R E L C G G C H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
V K N T G D L Y K L K I I S E S S I S S N V R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
V I G I T G N E V R K A E K K I E E I K L K V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
N G E V V H L D K S L P L F E R L R L E A K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
E N I E V I T K A K K E N F T K N L K N L K M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
I A V T R D T P V K Y E Q K I L Y E Y Q T L D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
E T K K D I L K N I G N F I K L F K E D E D F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
L W G K C E D F V H G Y V K Q T N S E E I R D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
F K D G F F L M K N G I L Q F S F K T D K N V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892
L L F N
- - - -
------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_ala_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_ala_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
I E Q V I T C K Y L K K M S S E T N K I W T G D
- - - - - - - - - - - - - - - - - - - - - T G D
---------------------------------------------------------------ACAGGAGAT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V R R Q F V K Y F E G L D H T F Y R S S P V I
E V R R Q F V K Y F E G L D H T F Y R S . P V I
GAGGTTCGAAGACAATTCGTGAAATACTTTGAGGGATTAGATCATACATTCTACAGATCT---CCAGTAATT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L N D P T I L F I N A G M N Q F K S I F L G T
P - - - - - - L F I N A G M N Q F K - - - - - -
CCT------------------CTGTTTATTAATGCTGGAATGAATCAATTTAAG------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E P N S E L S K L V R V A N S Q K C I R A G G
- - - - - - - - - L . R V A N S Q K C I R A - -
---------------------------TTG---AGAGTTGCAAATTCTCAAAAATGTATTAGAGCT------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K H N D L D D V G K D V Y H H T F F E M L G S W
- - - - - - - - - - - - - - - T F F E M L G S W
---------------------------------------------ACATTTTTTGAAATGTTAGGATCATGG
121122123124125126127128129130131132133134135136137138139140141142143144
S F G D Y F K E E A I E W A F K L L T Q V Y G I
S F - - - - K E E A I E W A F K L L T - - - - -
TCATTT------------AAAGAAGAAGCGATTGAATGGGCATTTAAACTTTTGACT---------------
145146147148149150151152153154155156157158159160161162163164165166167168
P K D R L Y A T Y F G G D P K L P S C P P D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K R I W L K Y L P E D R I L S C G S K E N F W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E M A D T G P C G P C S E I H Y D R I G G R D A
- - - - - - - - - - C S E I H Y - - - - - - - -
------------------------------TGTTCTGAAATACATTAT------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I S L V N K D D P D V I E I W N L V F M Q Y Y R
- - - - - - - - - - - - E I W N L V F M - - - -
------------------------------------GAAATTTGGAATCTTGTATTTATG------------
241242243244245246247248249250251252253254255256257258259260261262263264
E V D S T L T P L P K K C V D T G M G L E R L V
- - - - - - - - - - K K C V D T G M G L E R L V
------------------------------AAAAAATGTGTTGATACTGGTATGGGATTAGAAAGATTGGTT
265266267268269270271272273274275276277278279280281282283284285286287288
S I L Q N K T S N Y D I D L F K P I F D Q I H Q
S I - - - - - - - - - - - - - - - - - - - - - -
TCAATC------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V I S S S G V Q I P R Y S G K V G D I D D P E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I D M S Y R V I S D H I R T L T I A I A D G C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P S N E G R G Y V L R R I L R R A I R Y G S Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L K A G S N G E P W F Y K L V D S V S N I M G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y Y K E I P E N I Q I I K E V I L D E E K Q F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K T L F K G T E R F N K V I N K L K S S Q N N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q D Q N K K L F P A S E A F Q L Y S T Y G F P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D L T E L M A N E Q G F D F D R Q G F Q L C M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N H H L A S E G K N N K S F D D L I L K P D I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N N L L L E F G L K E T D D Q Y K Y Q S Q T Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K D F Y S N L I A I F D G N Q L L N A T E I Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K V I G L I F D K T T F Y S E S G G Q V A D T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
F I D F Q Y N N N D E V S I F Q V I D C K K F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N Y V L H I G I L L Q G K I E I S P E L K S L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S V D Y S R R N L I K K N H T G T H I L N F A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
R Q I L G S T C D Q R G S V V D P N K L R F D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S S Q K P L T L D Q I E E I E K M I N Q I I Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
K Q T V Y C Q T V E L S I A K Q I P N I R A I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
G E T Y P D P V R V L S V S K S V D S L I N S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
T D N N D Q E K V S I E F C G G T H V E N T S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
I I S F S I I S E E G I A K G I R R I V A V T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
N Q S E I A I E N A K R L K Q E F K K L E E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
G K E L E T L L N S F K S K L D E T K L L P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Y R R Q L S Q I I E E N Y K R V I A D A K K K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
K E R L N M A K E L A T K I G Q E Y S Q Q L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
N N E F P A L I L N I K Q I Q G D S K S M D V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G Q D I S K K Y P E A P I M L F T S G E F N D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
G V S V I S I M P K S K S D K L S S S N W L K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977978979980981982983984
T I E L C N G K C G G T D L R S V G S S K T G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
9859869879889899909919929939949959969979989991000100110021003
E S I E S M I Q L A L D L L K K N G I
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_asn_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S I A E A S S E A H V G S E V S V R G W V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R I R S S G G V T F I V I R D S T G I V Q C T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K N E L T P E Q Y D E I S S L G I E S S L S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I G T M K K E P R S P T G Y E I S I H K F T V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q K N D V F P I T K D Q G E E F L L D N R H L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R S R E F T S I L K V R S T I F R S F A D F F
- - - - - - - - - - - V R S T I F R S F A D F F
---------------------------------GTCCGATCAACAATATTCAGATCTTTTGCTGACTTCTTT
145146147148149150151152153154155156157158159160161162163164165166167168
Y D Q G Y Y Q V H T P F M V S T A V E G G S T L
Y D Q G Y Y Q V H T P F M V - - - - - - - - - -
TACGATCAGGGATATTACCAGGTTCATACTCCTTTCATGGTC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F K V D F F G E P I F L N Q S A Q F Y L E T M I
- - - - - - - - - - F L N Q S A Q F Y L E - - -
------------------------------TTTCTAAATCAAAGTGCGCAGTTCTACTTGGAA---------
193194195196197198199200201202203204205206207208209210211212213214215216
Y S L E K V F T I A P S F R A E K S R T R R H L
- - - E K V F T I A P S F R A - - - - - - - - -
---------GAAAAGGTATTCACAATAGCACCGAGCTTTAGAGCT---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T E Y W H A E A E V A W I D N R E M M D V E E N
T E Y W H A E A E V A - - - N R E M M D V E E N
ACTGAATACTGGCATGCGGAAGCAGAAGTAGCA---------AATAGAGAAATGATGGATGTAGAGGAAAAC
241242243244245246247248249250251252253254255256257258259260261262263264
M I Y Y I I Q R V I E E N Y D D L K L L G R D P
M I Y - - - - - - - - - - - - - - - - - - - - -
ATGATATAT---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E A L R A M K P P F P R V K Y S D I I K V A N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I G M Q L K Y G D D L G A D E E R Q I T M R Y C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K P V F V T N Y P K E L K P F Y M P Q D P D N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S E V L N H D L L A P E G Y G E I I G G S Q R I
- - - - N H D L L A - - - - - E I I G G S Q R -
------------AACCACGACCTGCTTGCA---------------GAAATTATAGGCGGAAGCCAAAGG---
361362363364365366367368369370371372373374375376377378379380381382383384
W D Y K E L M Q R I R E A G L D E S A Y Y W Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L R K Y G S V P H S G F G L G M D R L A M W I
- - - - - - - V P H S G F G L G M D R L A M W -
---------------------GTGCCGCATTCAGGGTTTGGACTTGGTATGGACAGGCTAGCAATGTGG---
409410411412413414415416417418419420421422423424425426427428429
M H L D N I R E A I P Y P R T I R R T K P
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_asn_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I H P S V T E L E K L V I D K E S Y K R M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E E W L K Y S W R W A V N E K Y K L V F K V Q A
- - - - - - - - - - - - - - - - - - - - - V Q A
---------------------------------------------------------------GTCCAAGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S I L R A L R E F L D S K G F V E V L S P I I G
S I L R A L R E F L D S K G F V E V L S P I I G
TCTATTCTGAGGGCGTTGCGAGAGTTTCTCGATTCCAAAGGCTTTGTGGAAGTGCTGTCTCCCATTATAGGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P V T D P G I R G A K Q A S I D F Y G A E Y K V
- - - - - - - - - - - - - - - - - - - - - - K V
------------------------------------------------------------------AAGGTT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M S S A I L Y K Q Y M A R V L G K I Y F V S P N
M S S A I L Y K Q - - - - - - G K I Y F V S P N
ATGTCTTCCGCCATTCTCTACAAGCAG------------------GGCAAGATCTACTTCGTCAGCCCAAAC
121122123124125126127128129130131132133134135136137138139140141142143144
I R L E P P D S I F T G R H L V E F Y Q L D L E
I R L - - - - - - - - - - - - V E F Y Q L D L E
ATTAGGCTG------------------------------------GTGGAGTTCTACCAATTAGACTTGGAG
145146147148149150151152153154155156157158159160161162163164165166167168
M Y K A T Y H E A M D L A E D L I T Y V V K Y V
M Y - - - Y H E A M D L A E D L I T - - - - - -
ATGTAC---------TACCATGAGGCAATGGACTTGGCAGAGGACCTCATAACT------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K D V H G K E L E A V L G R Q L Y E F K R P F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R Y S H K E A V E F V N K L G C E N S P R E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R W E C E K V M S A H H D S P F F V Y D Y P R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S R G F Y D R E D P E R P G V L R D F D M L Y P
- - - - - - - - - - - - - - - - - D F D M L Y -
---------------------------------------------------GACTTCGACATGTTATAC---
265266267268269270271272273274275276277278279280281282283284285286287288
E G F G E A I S G A E R E F E P E R L V E R I R
- - - - E A I S G A E R - - - - - - - - - - - -
------------GAGGCTATAAGCGGGGCTGAGAGG------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E G G E D P A K Y Q W F L Q M A K E L Y P L Q T
- - - - - - - - - - - - - - - - - - - - - L Q T
---------------------------------------------------------------CTACAGACC
313314315316317318319320321322323324325326327328329330331332333334335336
A G F G I G V E R L T R Y I C G L R A V W E A R
A G F G I G V E R L T R Y - - - - - - - - - - -
GCTGGGTTTGGGATTGGGGTGGAGAGGCTCACCAGATAT---------------------------------
337338339340341342343344345346347348
P Y P K V A G I I G G P
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_asn_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S I A E V S T K A Y V G S K V S I R G W V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R I R S S G G V T F V V V R D S S G I I Q C T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R K N E L P E D V Y D T I S S L G I E S S V E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H G T L K E D R R S P S G Y E I A V D S F R V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q K N D V F P I T K D Q G E E F L L D N R H L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R S R E F T S V L K I R S T I F R S F A D F F
- - - - - - - - - - - I R S T I F R S F A D F F
---------------------------------ATAAGATCGACCATATTCAGATCCTTCGCGGACTTCTTC
145146147148149150151152153154155156157158159160161162163164165166167168
Y E N G Y Y Q V Q T P F M V S T A V E G G S T L
Y E N G Y Y Q V Q T P F M V - - - - - - - - - -
TATGAGAACGGCTACTATCAGGTTCAGACGCCATTCATGGTT------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F K V D F F G E P I Y L N Q S A Q F Y L E T M I
- - - - - - - - - - Y L N Q S A Q F Y L E - - -
------------------------------TATCTCAATCAGAGCGCGCAGTTCTATCTTGAG---------
193194195196197198199200201202203204205206207208209210211212213214215216
Y S L E K V F T I A P S F R A E K S R T R R H L
- - - E K V F T I A P S F R A - - - - - - - - -
---------GAAAAGGTATTCACCATCGCACCGAGTTTTAGAGCT---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T E Y W H A E A E V A W I D N N E M M D I E E R
T E Y W H A E A E V A - - - N N E M M D I E E R
ACCGAATACTGGCATGCCGAGGCGGAGGTGGCC---------AACAATGAGATGATGGACATAGAGGAACGC
241242243244245246247248249250251252253254255256257258259260261262263264
M I Y Y I V S R V T E D N E D E L K M L N R D P
M I Y - - - - - - - - - - - - - - - - - - - - -
ATGATATAC---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V L K A M K P P F P R I R Y S E I I K V A N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I G L P L K Y G D D L G A D E E R Q I T M K Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R P I F V T N Y P K D L K P F Y M P V D P E N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G E V L N H D M L A P E G Y G E I I G G S Q R I
- - - - N H D M L A - - - - - E I I G G S Q R -
------------AACCATGATATGCTTGCT---------------GAGATAATCGGAGGGAGCCAGAGA---
361362363364365366367368369370371372373374375376377378379380381382383384
W N Y D E L M Q R I R E A N L D E S A Y Y W Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D L R K Y G S V P H S G F G L G L D R L A M W I
- - - - - - - V P H S G F G L G L D R L A M W -
---------------------GTACCGCACTCTGGCTTCGGGCTTGGCCTGGACAGGCTTGCGATGTGG---
409410411412413414415416417418419420421422423424425426427428429
M H L D N I R E A I P Y P R T I R R T K P
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_asn_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L Y L M Q I K G W V H K V R D L G K I K F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I R D G Y K I M Q A V I K K G E S P D Y L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L D I P I E S A V E I E G E E R E T N G K K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V K D L K I L A K A E P L P I D P K K A T P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K R F D Y R I I D L K L P E R Q T L F R L R A K
- - - - - - - - - - - - - - - - - - - - L R A K
------------------------------------------------------------TTAAGGGCCAAA
121122123124125126127128129130131132133134135136137138139140141142143144
V Q K F F R D W F M E N G F V E I N T P K I V I
V Q K F F R D W F M E N G F V E I N T P K I V -
GTACAAAAATTCTTTAGAGATTGGTTTATGGAAAATGGTTTTGTCGAAATAAATACTCCTAAAATAGTT---
145146147148149150151152153154155156157158159160161162163164165166167168
I G A E S G A E V F P V L Y F G K E A Y L T Q S
- - - - - - - - - - - - - - - - - - - Y L T Q S
---------------------------------------------------------TATTTAACACAATCT
169170171172173174175176177178179180181182183184185186187188189190191192
P Q L Y K Q M M V S V F P K V F E I A F A Y R A
P Q L Y K Q - - - - - - P K V F E I A F A Y R A
CCCCAATTGTATAAACAA------------------CCAAAGGTATTCGAAATTGCTTTCGCTTATAGGGCA
193194195196197198199200201202203204205206207208209210211212213214215216
E P S R T S R H L A E F T S V D A E M G F I K D
- - - - - - - - - A E F T S V D A E M G - - - -
---------------------------GCAGAATTCACTTCTGTAGATGCTGAAATGGGA------------
217218219220221222223224225226227228229230231232233234235236237238239240
E Y D V I N T I K K M L I D V S E K A M Q T K E
E Y D V I N T I K K M L I - - - - - - - - - - -
GAATATGATGTTATTAATACAATAAAGAAAATGTTAATC---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F E E L A K P I D L G F E I I T F D E A K E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G N P N E D L T T E E E R K L G E H F M E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V S F V A V T K Y P W S E R P F Y T M R L D D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P S Y T R G F D I I F R G L E I I S G A Q R E H
- - - - - G F D I I F - - - E I I S G A Q R - -
---------------GGTTTTGATATTATATTT---------GAAATAATAAGTGGGGCACAAAGA------
337338339340341342343344345346347348349350351352353354355356357358359360
R Y E K L L E N I K E K G I D P N K L E Y Y L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F K Y G M P P H G G F G L G L E R Y L R Q L L
- - - - - - P P H G G F G L G L E R Y L R Q - -
------------------CCCCCTCATGGGGGATTTGGATTGGGATTAGAGAGGTATTTAAGACAA------
385386387388389390391392393394395396397398399400401402403404
G L D D V R E V I L F Y R D I D R L L P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_asn_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L P F Q Y I E E L P R Y V G Q T V T L K G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L Y N K R S S K G L H F L M L R D G T G L V Q C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V A Q E K V D A D T W Q V A E E A T Q E C S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V V G T V V R D E R Q I G G H E I H V E R L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R I G P S E N Y P I T P K P H G I E F L M D H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
H L W L R S R R P W A I M R I R N R V I R A I H
- - - - - - - - - - - - - - I R N R V I R A I H
------------------------------------------GCCCCACTGGAAATTCCGGGCCGACTCCTT
145146147148149150151152153154155156157158159160161162163164165166167168
D F F Q E R G F L Q L D A P I L T G N A V E G T
D F F Q E R G F L Q L D A P I L T - - - - - - -
CCAGAGCGGCAGGTTTTCCAGTTCTTTTTCGATCTCGTCCAGACGCTGGTT---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T T L F E I D Y F G D R A Y L S Q S G Q L Y A E
- - - - - - - - - - - - - Y L S Q S G Q L Y A E
---------------------------------------CCGTCGGTTTTCGGCCCGCTCGGCCTCCAGTTG
193194195196197198199200201202203204205206207208209210211212213214215216
A M A M A F G K V Y T F G P T F R A E K S K T R
- - - - - - G K V Y T F G P T F R A - - - - - -
------------------CGCTTCGATGCGGGCGTCGATCATCCGGGCCGTCTC------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R H L T E F W M I E P E M A F Y D L E M N M A L
- - - T E F W M I E P E M A - - - L E M N M A L
---------CGAGTAGGTCAGCCGCGGGAAGGGCGGCTGCAC---------CGCCGCAACGTCGCGTCCGAG
241242243244245246247248249250251252253254255256257258259260261262263264
A E E L V V H I V Q E V L R H C R T E L E V L G
A E E L V V - - - - - - - - - - - - - - - - - -
CACCTCCAGCTCCGTCCG------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R D V A A L E R V Q P P F P R L T Y S E A V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R S D E T A R M I D A R I E A L K E E Q Q Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A E R A E N R R R Y G Q A R K A E K R R I D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R E I E I N Q R L D E I E K E L E N L P L W K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S A R N F Q W G N D F G N S D E T V L T W H F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R P I I V H R F P A A I K A F Y M K R D P E D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R L A L G M D V L A P E G Y G E I I G G G Q R A
- - - - G M D V L A - - - - - E I I G G G Q R -
------------TATTTCATGGCCGCCGAT---------------CACAACGGTCCCCACCACCTCCAG---
433434435436437438439440441442443444445446447448449450451452453454455456
D D L A F L E A Q I E A H G L P R E A F E W Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D L R R Y G S V P H S G F G L G L E R T L A W I
- - - - - - - V P H S G F G L G L E R T L A W -
---------------------CAACATCAGAAAATGCAGTCCCTTCGAGCTTCGCTTGTTGTAGAGCCA---
481482483484485486487488489490491492493494495496497498499500501
C G V H H V R E V I P F P R L L G R L T P
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_asn_aa
Archaea/Staphylothermus marinus/Smarinus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E N V V W Y H I E D V L S D D F I G K K V C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V R G W I Y R R S V V G G K A F V R V R G S T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I I Q V V V D R E K C G E E I V R I L K D I G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A S V M T C G E L V K Q P R A P G G Y E V H A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D W F R I V G Y S R D F P I K G G E G I D Y L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D N R H L W I R S R K L T E I M K I K H S V L K
- - - - - - - - - - - - - - - - - I K H S V L K
---------------------------------------------------ATCAAGCACAGTGTTCTCAAA
145146147148149150151152153154155156157158159160161162163164165166167168
A G R E Y F V E N D W W E V T P P I L T A S A V
A G R E Y F V E N D W W E V T P P I L T - - - -
GCTGGGAGAGAATACTTTGTAGAGAATGATTGGTGGGAAGTAACACCCCCAATACTGACA------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G G A T L F P V K Y F D K T A Y L S Q S A Q L
- - - - - - - - - - - - - - - - Y L S Q S A Q L
------------------------------------------------TATCTAAGCCAGAGCGCTCAACTA
193194195196197198199200201202203204205206207208209210211212213214215216
Y L E A L I Y S L E K V W S L T T S F R A E K S
Y L E - - - - - - E K V W S L T T S F R A - - -
TATCTTGAA------------------GAAAAAGTATGGAGCCTCACAACTAGTTTTAGAGCG---------
217218219220221222223224225226227228229230231232233234235236237238239240
R T R R H L A E Y W H L E A E A A W Y N M E D M
- - - - - - A E Y W H L E A E A A - - - M E D M
------------------GCAGAATACTGGCATTTAGAAGCAGAGGCTGCA---------ATGGAGGATATG
241242243244245246247248249250251252253254255256257258259260261262263264
M R V A E E L V A Y I V Q Y I L E H N K R Q L E
M R V A E E L V A - - - - - - - - - - - - - - -
ATGAGGGTAGCTGAAGAACTAGTAGCG---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I L G R D L K I L K N S V E P P Y P R I R Y D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A I E I L Q K K G V N I E W G D D L G A D E E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L T M E F D K P F F I T H F P K E I K S F Y M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K L D P E N E K L A L G F D L L A P E G Y G E I
- - - - - - - - - - - G F D L L A - - - - - E I
---------------------------------GGATTCGATCTCTTAGCG---------------GAAATT
361362363364365366367368369370371372373374375376377378379380381382383384
I G G S E R E D D Y N K L L N R I I E Q G Y D P
I G G S E R - - - - - - - - - - - - - - - - - -
ATAGGTGGGAGCGAGCGT------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E D Y K W Y L D L R K Y G S V P H S G F G L G I
- - - - - - - - - - - - - - V P H S G F G L G I
------------------------------------------GTACCCCATAGTGGTTTCGGCTTAGGAATC
409410411412413414415416417418419420421422423424425426427428429430431432
E R L V M W I A G L D H I R D A T P F P R F R G
E R L V M W - - - - - - - - - - - - - - - - - -
GAGAGACTAGTTATGTGG------------------------------------------------------
433434435436
R I Y P
- - - -
------------
Class II
Bacteria/Escherichia coli/amino acid sequences/Ecoli_asn_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S V V P V A D V L Q G R V A V D S E V T V R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V R T R R D S K A G I S F L A V Y D G S C F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P V Q A V I N N S L P N Y N E D V L R L T T G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V I V T G K V V A S P G Q G Q Q F E I Q A S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V E V A G W V E D P D T Y P M A A K R H S I E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R E V A H L R P R T N L I G A V A R V R H T L
- - - - - - - - - - - - - - - - - - - V R H T L
---------------------------------------------------------TTCAAACTTCCTGCC
145146147148149150151152153154155156157158159160161162163164165166167168
A Q A L H R F F N E Q G F F W V S T P L I T A S
A Q A L H R F F N E Q G F F W V S T P L I T - -
GCAGTTTTCGAGAATGGTCACTGCGTCGGTGTAATCCACCTGCGCGAAATCGGCCTCAATGAAGCG------
169170171172173174175176177178179180181182183184185186187188189190191192
D T E G A G E M F R V S T L D L E N L P R N D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G K V D F D K D F F G K E S F L T V S G Q L N G
- - - - - - - - - - - - - - F L T V S G Q L N G
------------------------------------------ATCGTTCAGGTTAGCAAACGCCACTTCCGG
217218219220221222223224225226227228229230231232233234235236237238239240
E T Y A C A L S K I Y T F G P T F R A E N S N T
E - - - - - - S K I Y T F G P T F R A - - - - -
CTC------------------CAGGTGACGGCTGGTGTTGGAGTTTTCAGCACGGAA---------------
241242243244245246247248249250251252253254255256257258259260261262263264
S R H L A E F W M L E P E V A F A N L N D I A G
- - - - A E F W M L E P E V A - - - L N D I A G
------------CAATGCGCAAGCGTAGGTTTCGCCGTTCAACTG---------GGTCAGGAAAGACTCTTT
265266267268269270271272273274275276277278279280281282283284285286287288
L A E A M L K Y V F K A V L E E R A D D M K F F
L A E A M L K - - - - - - - - - - - - - - - - -
ACCAAAGAAGTCTTTGTCGAA---------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A E R V D K D A V S R L E R F I E A D F A Q V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y T D A V T I L E N C G R K F E N P V Y W G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L S S E H E R Y L A E E H F K A P V V V K N Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K D I K A F Y M R L N E D G K T V A A M D V L A
- - - - - - - - - - - - - - - - - - A M D V L A
------------------------------------------------------TTGTTGCCCCTGGCCCGG
385386387388389390391392393394395396397398399400401402403404405406407408
P G I G E I I G G S Q R E E R L D V L D E R M L
- - - - E I I G G S Q R - - - - - - - - - - - -
------------TTTACCCGTCACAATGACCGAGCA------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E M G L N K E D Y W W Y R D L R R Y G T V P H S
- - - - - - - - - - - - - - - - - - - - V P H S
------------------------------------------------------------GAGGAAGGAGAT
433434435436437438439440441442443444445446447448449450451452453454455456
G F G L G F E R L I A Y V T G V Q N V R D V I P
G F G L G F E R L I A Y - - - - - - - - - - - -
GCCAGCTTTTGAATCTCGGCGGGTACGTACCCATCC------------------------------------
457458459460461462463464465466
F P R T P R N A S F
- - - - - - - - - -
------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_asn_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L L P T A T V A T I A R H V G Q R V T L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V Y H K T E K G K L I F I L L R D G S G T I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
C V T F K K N V S E A T F A T A Q A L T Q E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
C R I T G S V R A D E R A P G G Y E L D V E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L V G P S H E Y P I T P K E H G V E F L M E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R H L W V R S A K Q H A I L R I R A E V I A A A
- - - - - - - - - - - - - - - I R A E V I A A A
---------------------------------------------CCATGGTAACGGATAGGCGCCTTCGAC
145146147148149150151152153154155156157158159160161162163164165166167168
Q E W L N E Q G F V R F D T P I L T A T A A E G
Q E W L N E Q G F V R F D T P I L T - - - - - -
TTCTCCCTGATGTGCAGCGATCAGCTCGATGGCCTGATCGTAGGTAATACGCGG------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T T N L F A T D Y F D L G K A Y L A Q T G Q L Y
- - - - - - - - - - - - - - - Y L A Q T G Q L Y
---------------------------------------------ACGCCGGTCGAGCACACGGGCAACAAT
193194195196197198199200201202203204205206207208209210211212213214215216
V E A G M M S F G K V Y C F G P T F R A E K S K
V E - - - - - - G K V Y C F G P T F R A - - - -
GGCGCT------------------CCGCATGTTATCTTCGTGATCGGCGAACGCCACTTC------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R R H L T E F W M I E P E V A F A D H E D N M
- - - - - T E F W M I E P E V A - - - H E D N M
---------------GTGACGGCGTGTTTTGCTCTTCTCGGCGCGGAA---------GAAACAGTAGACTTT
241242243244245246247248249250251252253254255256257258259260261262263264
R L Q E Q F V S A I V A R V L D R R R E D L K V
R L Q E Q F V S - - - - - - - - - - - - - - - -
CCCGAACGACATCATCCCGGCTTC------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L E R D I S L L E Q V V P P F P R I T Y D Q A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E L I A A H Q G E V E G A Y P L P W G E D F G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P H E T L I A S K F D R P V F V E R F P S A V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A F Y M Q P D P N R P E V A L C A D L L A P E G
- - - - - - - - - - - - - - - C A D L L A - - -
---------------------------------------------CTCGTATCCGCCCGGGGC---------
361362363364365366367368369370371372373374375376377378379380381382383384
Y G E I I G G S Q R I H D P D L L E Q R I R A H
- - E I I G G S Q R - - - - - - - - - - - - - -
------TACACTACCGGTGATGCGACACGA------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G L R L E D Y Q W Y L D L R R Y G T V P H S G F
- - - - - - - - - - - - - - - - - - V P H S G F
------------------------------------------------------GAGAATAAAGATGAGTTT
409410411412413414415416417418419420421422423424425426427428429430431432
G M G I E R V V A W I T G T R H I R E T I P F P
G M G I E R V V A W - - - - - - - - - - - - - -
GCCTTTTTCCGTCTTGTGGTAGACCCATCC------------------------------------------
433434435436437438439440
R Q L Y R I Y P
- - - - - - - -
------------------------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_asn_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A S A R I V D L L S Q G Q P G Q T V V V R G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R T A R Q L K E F T F V E V N D G S C L K G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q V V L G Q E L A D Y E M L A K Q L D T G A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A V E G Q L V A S P A K G Q R V E L Q A A S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I V G G A D P E Q Y P L Q K K R H S F E F L R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I A H L R P R T N S L G A V M R V R N A A A T A
- - - - - - - - - - - - - - - - V R N A A A T A
------------------------------------------------GTTCGCAATGCTGCGGCAACTGCG
145146147148149150151152153154155156157158159160161162163164165166167168
I H D F F Q E R G F L W V H T P I I T A S D C E
I H D F F Q E R G F L W V H T P I I T - - - - -
ATTCATGACTTCTTCCAAGAGCGCGGCTTCCTCTGGGTGCATACGCCGATTATCACG---------------
169170171172173174175176177178179180181182183184185186187188189190191192
G A G E L F T V T N L D L D K L G Q S Q Q A P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F E Q D F F G K R A Y L T V S G Q L E A E I M A
- - - - - - - - - - Y L T V S G Q L E A E - - -
------------------------------TATTTAACCGTCAGCGGCCAGCTCGAAGCCGAG---------
217218219220221222223224225226227228229230231232233234235236237238239240
L A F S N V Y T F G P T F R A E N S N T S R H L
- - - S N V Y T F G P T F R A - - - - - - - - -
---------AGCAACGTCTACACCTTTGGCCCGACTTTTCGCGCT---------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A E F W M V E P E M A F C D L G G D M D L A E A
A E F W M V E P E M A - - - L G G D M D L A E A
GCAGAGTTTTGGATGGTCGAGCCGGAGATGGCT---------CTTGGCGGCGACATGGACTTGGCCGAAGCC
265266267268269270271272273274275276277278279280281282283284285286287288
F L K F V F Q R V S D R C S E D L E F F N Q R I
F L K - - - - - - - - - - - - - - - - - - - - -
TTCTTGAAA---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D S E V L N R A E T I L N N D F E R V S Y T D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I A L L E K A D R S F D Y P V A W G I D L Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H E R Y L A E E Y F R K P L I V Y D Y P R E I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F Y M R L N D D Q K T V A A M D V L A P G I G
- - - - - - - - - - - - - - A M D V L A - - - -
------------------------------------------GCAATGGACGTGCTGGCA------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I I G G S Q R E E R L D V L K Q R L A E A N L
E I I G G S Q R - - - - - - - - - - - - - - - -
GAAATCATCGGCGGTTCTCAGCGG------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P E E N Y W W Y L D L R R Y G S V P H A G F G L
- - - - - - - - - - - - - - - - V P H A G F G L
------------------------------------------------GTTCCCCATGCCGGATTTGGCCTA
433434435436437438439440441442443444445446447448449450451452453454455456
G F E R L V Q F I T G M G N I R D V I P F P R T
G F E R L V Q F - - - - - - - - - - - - - - - -
GGCTTTGAGCGACTGGTGCAATTC------------------------------------------------
457458459460461462
P Q N A E F
- - - - - -
------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_asn_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K I S R T K I V D L M K R E D F G A M V N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K G W V R T R R G S K Q V N F I A L N D G S T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N N V Q V V V D L A N F D E E M L K Q I T T G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
C L S V N G V L T E S V G A G Q K A E V Q A R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I E V L G T C D N T Y P L Q K K G H S M E F L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E I A H L R P R T N T F G A V F R I R H N M A I
- - - - - - - - - - - - - - - - - I R H N M A I
---------------------------------------------------CGGGAATTCGAATTTATGTCC
145146147148149150151152153154155156157158159160161162163164165166167168
A I H K F F H E K G F F Y F H T P I I T A S D C
A I H K F F H E K G F F Y F H T P I I T - - - -
TTTGGCAACAGCTTCTTCCAGTATTTTAATACCTTCCGTGTATGGCAGACGGACGAAGTC------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G A G Q M F Q V T T M N L Y D L K K D A N G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I V Y D D D F F G K Q A S L T V S G Q L E G E L
- - - - - - - - - - - - S L T V S G Q L E G E -
------------------------------------AGCCAAATCCATATTCTCCTGAATTTCGTTGAA---
217218219220221222223224225226227228229230231232233234235236237238239240
A A T A L G A I Y T F G P T F R A E N S N T P R
- - - - - G A I Y T F G P T F R A - - - - - - -
---------------CATCCAAAACTCGGCCAAGTGACGCGGAGTGTTAGA---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H L A E F W M I E P E V A F N E I Q E N M D L A
- - A E F W M I E P E V A - - - I Q E N M D L A
------CGTATAGATTGCACCTAAAGCGGTAGCAGCTAA---------CAACTGTCCCGAAACAGTCAAACT
265266267268269270271272273274275276277278279280281282283284285286287288
E E F I K Y C V R W A L D N C A D D V K F L N D
E E F I K - - - - - - - - - - - - - - - - - - -
GGCTTGTTTGCCAAA---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
M F D K G L I E R L E G V L K E D F V R L P Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E G I K I L E E A V A K G H K F E F P V Y W G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D L A S E H E R Y L V E D H F K R P V I L T D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P K E I K A F Y M K Q N E D G K T V R A M D V L
- - - - - - - - - - - - - - - - - - - A M D V L
---------------------------------------------------------CTTCTGTCCGGCGCC
385386387388389390391392393394395396397398399400401402403404405406407408
F P K I G E I I G G S E R E S D Y N K L M T R I
F - - - - E I I G G S E R - - - - - - - - - - -
TAC------------CACACCGTTCACGCTCAGACAAGC---------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E E M H I P M K D M W W Y L D T R K F G T C P H
- - - - - - - - - - - - - - - - - - - - - C P H
---------------------------------------------------------------AAAGTTAAC
433434435436437438439440441442443444445446447448449450451452453454455456
S G F G L G F E R L L L F V T G M S N I R D V I
S G F G L G F E R L L L F - - - - - - - - - - -
TTGTTTGCTGCCTCTGCGGGTGCGAACCCATCCTTTCAC---------------------------------
457458459460461462463464465466467
P F P R T P R N A D F
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_asn_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A L L P S M Y I R D S A D H V G E A V K L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V Y H K T E K G K L V F I Q L R D G T A T I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
C V V F K K N V S E E V F A R A K E L T Q E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
C Y I H G T L R A D E R S S L G F E L D V T D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E I V H L T Q N Y P I T P K E H G T Q F L M E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R H L W V R S A K Q H A L L R I R A Q V I A A A
- - - - - - - - - - - - - - - I R A Q V I A A A
---------------------------------------------CCATTCCAAATCGGCTAATGGTGCATT
145146147148149150151152153154155156157158159160161162163164165166167168
Q E Y L N S E H F V R Y D S P I L T A T A A E G
Q E Y L N S E H F V R Y D S P I L T - - - - - -
ATCGGGAGCAACAGTTGCCCCTGCCGCCACACCTTGCTTGATTTTTTCAATCGC------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T S D L F A T E Y F D L G N A Y L A Q T G Q L Y
- - - - - - - - - - - - - - - Y L A Q T G Q L Y
---------------------------------------------TAAAATTTTGAGATCTTCTTCGCAGCG
193194195196197198199200201202203204205206207208209210211212213214215216
V E S G M A T F G R V Y C F G P T F R A E K S K
V E - - - - - - G R V Y C F G P T F R A - - - -
ATCAAG------------------GGAAACGAAATTTTCTTGCAATTCCATATTATCGTC------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R R H L T E F W M I E P E F A F A D Q D D N M
- - - - - T E F W M I E P E F A - - - Q D D N M
---------------GATCATCCAAAATTCGGTCAGGTGGCGACGAGT---------TTCAGCCCGAAAAGT
241242243244245246247248249250251252253254255256257258259260261262263264
E L Q E N F V S Y I V Q R V L D R C E E D L K I
E L Q E N F V S - - - - - - - - - - - - - - - -
GGGGCCAAAACAATAAACCCGACC------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L E R D T S K L E N I V P P F P R I S Y D E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K I K Q G V A A G A T V A P D N A P L A D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
W G D D F G A P H E T Y L A S L F D K P L F I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N Y P T K V K A F Y M Q P A E G R P E V V R C A
- - - - - - - - - - - - - - - - - - - - - - C A
------------------------------------------------------------------TTCAAA
361362363364365366367368369370371372373374375376377378379380381382383384
D L I A P E G Y G E I I G G S Q R I H D A E L L
D L I A - - - - - E I I G G S Q R - - - - - - -
ACCCAAGCTCGA---------------AAGTGTACCATGGATATAGCACGA---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E A R I R E H G L D V A D Y Q W Y L D L R R Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S V P H S G F G M G I E R C V A W L A G T R H I
- V P H S G F G M G I E R C V A W - - - - - - -
---TTGAATAAAAACCAACTTGCCTTTTTCGGTTTTGTGATAGACCCAACC---------------------
433434435436437438439440441442443444445446447
R E A I P F P R Q L Y R I Y P
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_asn_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D K I S V S D A R R A E A V G R H V R L Q G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V R T R R D S K G G F S F I E L N D G S C Q G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V Q V V A P G E L A N Y E S V V K H L H T G A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V R I D G E V K A S P A K G Q A T E V L A A S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L I G D A D V N T Y P L Q K K G H S F E F L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G I A H L R P R T N T L G A V A R V R H Q V S I
- - - - - - - - - - - - - - - - - V R H Q V S I
---------------------------------------------------CGGGTACTCCCACGTCTTGCC
145146147148149150151152153154155156157158159160161162163164165166167168
S I H Q F F H E R G F Y Y V H T P V I T A S D C
S I H Q F F H E R G F Y Y V H T P V I T - - - -
GCTCTTCAGCAGGATGTCCACGCCCTCCGTGTACGACACCCGCTTGAACCCGTTGTTGAG------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G A G A M F R V S T I D P E A P P K A E G K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D Y K Q D F F G K P A Y L T V S G Q L Q G E A F
- - - - - - - - - - - Y L T V S G Q L Q G E - -
---------------------------------CGCGAGGTCCATGTTGTCGGTGAGGTCGTAGAA------
217218219220221222223224225226227228229230231232233234235236237238239240
A C A L G K I Y T F G P T F R A E N S N T P R H
- - - - G K I Y T F G P T F R A - - - - - - - -
------------CATCCAGAACTCGGCGAGGTGCCGCGGGGTGTTCGA------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L A E F W M I E P E M A F Y D L T D N M D L A E
- A E F W M I E P E M A - - - L T D N M D L A E
---GGTGTAGATCTTCCCCAGCGCGCACGCGAACGC---------AAGTTGCCCGCTCACCGTCAGGTACGC
265266267268269270271272273274275276277278279280281282283284285286287288
A F L K R I I S D A M T Y C L E D L K F F A E K
A F L K - - - - - - - - - - - - - - - - - - - -
CGGCTTGCCGAA------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E N N K G L F E K L E N V L N N G F K R V S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T E G V D I L L K S G K T W E Y P V A W G V D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q S E H E R Y L A E Q H F K C P V I L Y D Y P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L K P F Y M K V N D D G K T V R A M D V L V P
- - - - - - - - - - - - - - - - - A M D V L V -
---------------------------------------------------CGTGGCCTGCCCCTTGGC---
385386387388389390391392393394395396397398399400401402403404405406407408
G V G E I I G G S Q R E E R L D V L E S R M R E
- - - E I I G G S Q R - - - - - - - - - - - - -
---------CACCTCGCCGTCGATGCGCACGCT---------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q G L P P E G Y E W Y L D L R R Y G T V P H S G
- - - - - - - - - - - - - - - - - - - V P H S G
---------------------------------------------------------TTCGATGAAGCTGAA
433434435436437438439440441442443444445446447448449450451452453454455456
F G L G L E R T I L F L S G M A N I R D V I P F
F G L G L E R T I L F - - - - - - - - - - - - -
CCCGCCCTTCGAGTCGCGCCGGGTGCGCACCCA---------------------------------------
457458459460461462463464465
P R T P G N A E Y
- - - - - - - - -
---------------------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_asn_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_asn_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K R R I I E I L R N G Q S D E S V T V Q G W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R T K R D L K G F A F V E V N D G S S L A S L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A V L K A E M P D Y E A T L K Q I N T G A S V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I S G V L V P S Q G K G Q R I E L Q A E T V K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F G D A D P E T Y P L Q K K R H S F E F L R T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G H L R S R T N S L G A V F R V R N A C A T A I
- - - - - - - - - - - - - - - V R N A C A T A I
---------------------------------------------CTCAACCGGATATTCAAAGGTTTTTGT
145146147148149150151152153154155156157158159160161162163164165166167168
H Q F F Q E R S F L W V H T P V I T R N D C E G
H Q F F Q E R S F L W V H T P V I T - - - - - -
GGCTTTTTCTAACTGCGCGATCGCCTCTGTATAAGTAATTCGTTCAAATTGGTT------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A G E L F T V T S L D L K K I P Q T E N G K I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y S Q D F F G G Q A F L T V S G Q L E A E V M A
- - - - - - - - - - F L T V S G Q L E A E - - -
------------------------------TAAATCCATATTTCCCACTAAATCGCAAAAAGC---------
217218219220221222223224225226227228229230231232233234235236237238239240
M A F S N V Y T F G P T F R A E N S N T S R H L
- - - S N V Y T F G P T F R A - - - - - - - - -
---------CCAAAATTCTGCTAAATGTCGAGATGTATTAGAATT---------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A E F W M V E P E M A F C D L V G N M D L A E A
A E F W M V E P E M A - - - L V G N M D L A E A
GTAGACGTTGCTAAACGCCATCGCCATGACTTC---------TTGTCCGCTGACAGTTAAAAAAGCTTGTCC
265266267268269270271272273274275276277278279280281282283284285286287288
F L K H I F K Y V L E T C P E D M K F F N Q R I
F L K - - - - - - - - - - - - - - - - - - - - -
GCCAAAAAA---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D D S V L A T A D N I I N N Q F E R I T Y T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I A Q L E K A T K T F E Y P V E W G L D L Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H E R Y L A E E L F K K P V I V T D Y P K Q I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F Y M R V N D D D K T V R A M D V L A P K I G
- - - - - - - - - - - - - - A M D V L A - - - -
------------------------------------------CAATTCAATTCTTTGCCC------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I I G G S Q R E E R L E V L E K R M Q A Q D I
E I I G G S Q R - - - - - - - - - - - - - - - -
AGGCACTAGCACCCCGCTAATTTC------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N P D D L W W Y L D L R R Y G T V P H A G F G L
- - - - - - - - - - - - - - - - V P H A G F G L
------------------------------------------------GTTCACTTCTACAAACGCAAACCC
433434435436437438439440441442443444445446447448449450451452453454455456
G F E R L V Q F M T G M G N I R D V I P F P R A
G F E R L V Q F - - - - - - - - - - - - - - - -
TTTTAAATCGCGTTTGGTGCGTAC------------------------------------------------
457458459460461462
P L S A E F
- - - - - -
------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_asn_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T S I K H L L I N A K K Y D Q K E F E I K A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V A S N R G N T N I R F V E I N D G S T I K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q V V I K K E I M S F L E V D K I R L G A A I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V K G V L K Y T P G M A Q E I E L N A D K F I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K N T D E D F P I Q K K E T S L E A L R E I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
H L R H R T T T L R A I M L I R S T L A L E I H
- - - - - - - - - - - - - - I R S T L A L E I H
------------------------------------------ATTAGATCAACACTTGCTTTAGAAATTCAT
145146147148149150151152153154155156157158159160161162163164165166167168
K F Y N E R G Y L W V S S P I I T G N D G E G A
K F Y N E R G Y L W V S S P I I T - - - - - - -
AAATTTTACAATGAAAGAGGATATTTATGAGTATCTTCACCTATAATTACA---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G E S F V V D D E S K D F F F N K K A T L G V T
- - - - - - - - - - - - - - - - - - - T L G V T
---------------------------------------------------------ACATTAGGAGTTACT
193194195196197198199200201202203204205206207208209210211212213214215216
G Q L H A E A Y A L G F S K V Y T F A P T F R A
G Q L H A E - - - - - - S K V Y T F A P T F R A
GGACAATTGCATGCTGAA------------------AGTAAAGTTTATACTTTTGCCCCTACTTTTAGAGCT
217218219220221222223224225226227228229230231232233234235236237238239240
E N S N T T K H A A E F W M M E P E V A F F D L
- - - - - - - - - A E F W M M E P E V A - - - L
---------------------------GCTGAATTTTGAATGATGGAGCCGGAAGTAGCA---------TTA
241242243244245246247248249250251252253254255256257258259260261262263264
K D L I K M S D D M L R Q V I K R T V E A H P H
K D L I K M S D D M L R - - - - - - - - - - - -
AAAGATCTTATTAAAATGTCAGATGATATGTTAAGA------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E F E F F E K N K P G L L K N L N L F L N N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S I L E Y R E A I K I L E K V K D R F E D K N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F F G K D L A T E H E K Y L A E K H I Q G P V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I N Y P K S F K A F Y M F Q N E D N E T V A A
- - - - - - - - - - - - - - - - - - - - - - - A
---------------------------------------------------------------------GCT
361362363364365366367368369370371372373374375376377378379380381382383384
Y D L L V P G I G E V I G G S K R E T R Y E K L
Y D L L V - - - - E V I G G S K R - - - - - - -
TATGATTTACTTGTA------------GAAGTAATTGGTGGTTCTAAACGT---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V Q R V K D L K I N Q E D L Q W Y L D L R R F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q A S S A G F G L G F E R L I M Y I T G T E N I
- A S S A G F G L G F E R L I M Y - - - - - - -
---GCTTCAAGTGCAGGTTTTGGTTTAGGTTTTGAAAGATTGATTATGTAC---------------------
433434435436437438439440441442443444445446447
R D T I P F P R T P K N M K M
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_asn_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F A S I K D I L K N P I L N S N V T I N G W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R T K R S N G K I G F I E I N D G S T L K G I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A V I N E E E N Q F S E K D L K K L T T G T S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S L T G L L V E S P A K G Q N Y E I K T H S F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V I G E T D P E T Y P L Q K K R H S F E F L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I P H L R I R T N T F G A I A R V R N K I S Y K
- - - - - - - - - - - - - - - - V R N K I S Y K
------------------------------------------------GTAAGAAACAAAATTTCATACAAA
145146147148149150151152153154155156157158159160161162163164165166167168
I H E Y F Q K N G F F Y I N T P I I T S N D G E
I H E Y F Q K N G F F Y I N T P I I T - - - - -
ATTCATGAATATTTCCAAAAAAATGGTTTTTTTTATATTAATACACCAATAATTACA---------------
169170171172173174175176177178179180181182183184185186187188189190191192
G A G E M F R V S T L K F N K L N N A L S N I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F K D D F F G K E A F L S V T G Q L H G E A Y A
- - - - - - - - - - F L S V T G Q L H G E - - -
------------------------------TTTCTCTCTGTCACTGGTCAATTGCATGGGGAA---------
217218219220221222223224225226227228229230231232233234235236237238239240
M A L S K I Y T F G P T F R A E N S N T T R H A
- - - S K I Y T F G P T F R A - - - - - - - - -
---------TCTAAAATATATACATTCGGACCAACATTTAGAGCA---------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S E F W M I E P E M A F Y K L N D N I A L A E D
S E F W M I E P E M A - - - L N D N I A L A E D
TCAGAATTTTGGATGATAGAACCAGAAATGGCT---------CTTAACGACAATATTGCCCTAGCAGAAGAT
265266267268269270271272273274275276277278279280281282283284285286287288
L L K Y L L S S I L N E C S Q D M D F L E N Y I
L L K - - - - - - - - - - - - - - - - - - - - -
CTCTTGAAA---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K G L I K K L E N V I N S N F E V I T Y T K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I E I L E N S K K N F E I K P Y W G I D L Q T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H E R Y L T E E T F K K P V V V I D Y P K N F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F Y M K A N K D N K T V K G M D I L V P K I G
- - - - - - - - - - - - - - G M D I L V - - - -
------------------------------------------GGAATGGACATACTTGTT------------
385386387388389390391392393394395396397398399400401402403404405406407408
E I I G G S E R E D D L Q K L E N R I K E L N L
E I I G G S E R - - - - - - - - - - - - - - - -
GAGATTATAGGGGGAAGCGAAAGA------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N I E H L N W Y L D L R R F G S A P H S G F G L
- - - - - - - - - - - - - - - - A P H S G F G L
------------------------------------------------GCTCCTCATTCTGGCTTTGGACTT
433434435436437438439440441442443444445446447448449450451452453454455456
G L E R L V Q Y S T G I S N I R D S I P F P R T
G L E R L V Q Y - - - - - - - - - - - - - - - -
GGACTTGAAAGATTGGTGCAATAC------------------------------------------------
457458459460461462
P K N L Y F
- - - - - -
------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_asn_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K R I K I K E L F I A N P V G T K V C I K G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V R T K R I S K Q V V F I M L N D G S T I H N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q I V T E P E K F A E D I M Q H I A T G V S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V C G T V I A S Q G G N Q A I E L Q A D T I E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L G T A T D Y P L Q P K K H S L E F L R E I A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R F R T N T F S A V F R I R H A I S Y A I H Q
- - - - - - - - - - - - - I R H A I S Y A I H Q
---------------------------------------GCCCCATTCATCAATAGGATAAGCAAACTTTTT
145146147148149150151152153154155156157158159160161162163164165166167168
F F H E Q G F V Y L H T P I I T A V D A E G A G
F F H E Q G F V Y L H T P I I T - - - - - - - -
CTCTTTATTAGGCTGAGAAGCTTTTAAAATATCAATTGCTTCTGTATA------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E M F S V T T L N M E Q L P K T P Q G Q V D F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R D F F G Q K T S L T V S G Q L E A E A A A L G
- - - - - - - - S L T V S G Q L E A E - - - - -
------------------------ATCATCTTTACAATGCTCTAATGCAAAACCAAT---------------
217218219220221222223224225226227228229230231232233234235236237238239240
L A E V Y T F G P T F R A E N S N T T R H L A E
- A E V Y T F G P T F R A - - - - - - - - - A E
---CTCTGCTAAAGCTATGTTATCAGCTAAATCATAAAA---------------------------CTCGGC
241242243244245246247248249250251252253254255256257258259260261262263264
F W M V E P E M A F Y D L A D N I A L A E R F L
F W M V E P E M A - - - L A D N I A L A E R F L
TAAGTGCCGGGTAGTGTTAGAGTTTTC---------AGTTGGACCAAATGTATATACTTCTGCCAAACCTAA
265266267268269270271272273274275276277278279280281282283284285286287288
K Y V I G F A L E H C K D D L E F L Q K R E L D
K - - - - - - - - - - - - - - - - - - - - - - -
GGC---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A R V G K Q T D K S F L P L L D R L D N I L T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P F A C I S Y T E A I D I L K A S Q P N K E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F A Y P I D E W G C D L Q S E H E R Y L V E K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F T K P V I I T N Y P R A I K A F Y M H Q Q E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G K T V A A M D I L F P G I G E I I G G S Q R E
- - - - - A M D I L F - - - - E I I G G S Q R -
---------------TAACTCTATGGCTTGGTT------------AGCTATAACAGTACCACAAACAGA---
409410411412413414415416417418419420421422423424425426427428429430431432
E R L D K L T E A I Q S M G M N S N I L Q W Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D T R L F G T V P H S G F G L G L E R L V Q F V
- - - - - - - V P H S G F G L G L E R L V Q F -
---------------------TAGCATTATAAAAACTACTTGCTTACTAATACGCTTGGTTCTTACCCA---
457458459460461462463464465466467468469470471472473474475476477
T G M D N I R D V I P F P R T P G N A A F
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_asn_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K T T I K Q A K D H L N Q D V T I G A W L T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K R S S G K I A F L Q L R D G T G F M Q G V V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K S E V D E E V F K L A K E I T Q E S S L Y V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G T I T E D N R S D L G Y E M Q V K S I E V I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E A H D Y P I T P K N H G T E F L M D H R H L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R S K K Q H A V M K I R N E V I R A T Y E F F
- - - - - - - - - - - I R N E V I R A T Y E F F
---------------------------------AAAATCTTCGCCCCATTCAATATCATCAAAGCCTTCTGC
145146147148149150151152153154155156157158159160161162163164165166167168
N K D G F T K V D P P I L T A S A P E G T S E L
N K D G F T K V D P P I L T - - - - - - - - - -
TTTCAAGAACTCAATTGCATCATCATATGAAATTCTAGGGAA------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F H T K Y F D Q D A F L S Q S G Q L Y L E A A A
- - - - - - - - - - F L S Q S G Q L Y L E - - -
------------------------------ACAATTTTCTAAAACTGATTTTACTACATGTGT---------
193194195196197198199200201202203204205206207208209210211212213214215216
M A H G K V F S F G P T F R A E K S K T R R H L
- - - G K V F S F G P T F R A - - - - - - - - -
---------TTCTAAACTTTCAGCATGATTTGTGAAAGCCATTTC---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I E F W M I E G E M A F T N H A E S L E I Q E Q
I E F W M I E G E M A - - - H A E S L E I Q E Q
GTGTCTACGTGTTTTTGATTTTTCAGCTCTGAA---------AAATGAAAATACTTTTCCGTGTGCCATTGC
241242243244245246247248249250251252253254255256257258259260261262263264
Y V T H V V K S V L E N C K L E L K M L E R D T
Y V T - - - - - - - - - - - - - - - - - - - - -
CGCAGCTTC---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S K L E K V A T P F P R I S Y D D A I E F L K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E G F D D I E W G E D F G A P H E T A I A N H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D L P V F I T N Y P T K I K P F Y M Q P N P E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E E T V L C A D L I A P E G Y G E I I G G S E R
- - - - - C A D L I A - - - - - E I I G G S E R
---------------TTTCACTTGCATTTCGTA---------------ATTATCTTCTGTAATTGTGCCTGT
361362363364365366367368369370371372373374375376377378379380381382383384
V D D L E L L E Q R V K E H G L D E E A Y S Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L D L R R Y G S V P H C G F G L G L E R T V A W
- - - - - - - - V P H C G F G L G L E R T V A W
------------------------TCCATCACGTAATTGTAAAAAGGCGATTTTACCACTTGAACGTTTATT
409410411412413414415416417418419420421422423424425426427428429430
I S G V E H V R E T A P F P R L L N R L Y P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_asn_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H A K A L A R L R M H H A A R Q R M F S V G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W R A L W V V A K L T M P E K E A P G W Q T T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q V N L A M I T E K P H A L A S P M M A S S V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P A V D E A P S F A T T S P P L A P G R G F T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L S C S V L V P V S L E P P L P A T S L P W R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R G L R T G T C A S S S S A L V L T A A S S L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S S L R Q H W S S C T T L S R C P F F S L A L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L C L L R H R R T L P P H H H H R S P R L P L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T P C R T I A I Q L H S V L L F K A S G S K G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R A E S E R T M E N E Q Q R T A A V A Q L K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V G L D D R G A K D L S S K P E R V A D V L A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F A Q H S I D E A S P R E Q K V M L F N V W T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V K K P E H R D P V T A F I L D G K L D S T Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V D A A I R F V N A A G S D V V D T A A M L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C G V G V T V S R E D V E K A V A A A L V A E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V A A L K T K W D K N P N M M L G Q M R R V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L R W A D V E H V R A A L E R Q V P G L I K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I V E A K P A A A K K E A A A M P K K E V E S C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R Q N S N F K D V A Q G L P R S P I G E L P S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K E G A C V Y V V G W A H R V R H Q S R M S F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V L R D G T G F I Q C V F D G S T E P F H R E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
C V A I R G T L R H E P K A K S E L Q P P M E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
H V N E Y A V V G D S D G T I E T V I T A E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V D K L Y D Q R H V V V R G T L A S S V L K V R
- - - - - - - - - - - - - - - - - - - - - - V R
------------------------------------------------------------------GATGGC
577578579580581582583584585586587588589590591592593594595596597598599600
H E L L R V F R E H F W S H Q Y Y E V T P P T L
H E L L R V F R E H F W S H Q Y Y E V T P P T L
GGCGTCGACCTTCTGCGTGCTGTCGAGTTTGCCGTCAAGGATGAAGGCGGTCACGGGATCGCGGTGCTCAGG
601602603604605606607608609610611612613614615616617618619620621622623624
V Q T Q V E G G S T L F E V L Y Y G E K A Y L T
V - - - - - - - - - - - - - - - - - - - - Y L T
CTT------------------------------------------------------------GATGCTGTG
625626627628629630631632633634635636637638639640641642643644645646647648
Q S S Q L Y L E S V T A S L G N V Y C C M P S Y
Q S S Q L Y L E - - - - - - G N V Y C C M P S Y
CTGCGCGAAGAAGGCCAGCACATC------------------GCTGGACAGGTCTTTGGCGCCCCTGTCGTC
649650651652653654655656657658659660661662663664665666667668669670671672
R A E R S K T K R H L S E F T H L E A E Y D V C
R A - - - - - - - - - S E F T H L E A E Y D - -
AAGGCC---------------------------AGCGGTGCGCTGCTGCTCGTTCTCCATGGTGCG------
673674675676677678679680681682683684685686687688689690691692693694695696
S F E D L L N H L E G M F C T V I R T V I E R V
- F E D L L N H L E G M F C - - - - - - - - - -
---CGCCCGTGGGCCTTTCGAGCCCGATGCCTTAAAGAGTAA------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
G D L V A M L N P S Q L I D P N G N V R D P A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
Y K F T P K R P F R R L R Y A D A I Q F C N E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
G I L N T E T G K P F E F G E D I T D Q P E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
M V A K L G E F V F M T H F P A S M K S F Y M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810811812813814815816
R D P D D P T L T E S V D V L A P G I G E V L G
- - - - - - - - - - S V D V L A - - - - E V L G
------------------------------TGCAAGAGGCGGTGACGT------------GGGCGCCTCGTC
817818819820821822823824825826827828829830831832833834835836837838839840
G S M R M Y K Y D E L L D A Y K R E G L D A S T
G S M R - - - - - - - - - - - - - - - - - - - -
CACCGCCGGCCG------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
Y Y W Y T D Q R R Y G G A P H G G F G L G V E R
- - - - - - - - - - - - A P H G G F G L G V E R
------------------------------------CTTTTCGGGCATCGTCAGCTTCGCCACCACCCACAA
865866867868869870871872873874875876877878879880881882883884885886887888
L L V W M L N L D S V K D A C L Y P R Y M G R C
L L V W - - - - - - - - - - - - - - - - - - - -
CGCCCGCCACAT------------------------------------------------------------
889890
K P
- -
------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_asn_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V Y E E V S L K N L K I K N D Y K S I E L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I S K S D M H K R I K T F G W V D C C R T G K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I T F F D L T C Q F K S I K C V Y E K K I D L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K C T S L T I Y G T I Q E N K S K K E N A E F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V L V E K L E I F N D A I A P S F P L N K E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F D T M M K Y G H L A L R N K Q R G F F L K A R
- - - - - - - - - - - - - - - - - - - - - - A R
------------------------------------------------------------------GTCGTC
145146147148149150151152153154155156157158159160161162163164165166167168
S S L L K I I R D I F Y E G N F I E I T P P T I
S S L L K I I R D I F Y E G N F I E I T P P T I
TTTTTTTACACCTTCATCATTCAAAAATTTGATAGCATCTACGTATCTTATTCTTTTAAATGGGCGTTTAGG
169170171172173174175176177178179180181182183184185186187188189190191192
V Q T Q V E G G S T L F K L K Y Y D K D A Y L T
V - - - - - - - - - - - - - - - - - - - - Y L T
GAC------------------------------------------------------------TCTTTTAAT
193194195196197198199200201202203204205206207208209210211212213214215216
Q S S Q L Y L E T V A P V A Y R A Y C I A S S Y
Q S S Q L Y L E - - - - - - Y R A Y C I A S S Y
AGATTCAGTAACCAAATGTTCAAT------------------AAATTCAATATTTGCTAATTCTGCTTCTAC
217218219220221222223224225226227228229230231232233234235236237238239240
R A E K S N T T R H L S E Y T H V E A E L A N I
R A - - - - - - - - - S E Y T H V E A E L A - -
ATGAGT---------------------------ACTTTTTTCTGCACGGTACGACGAAGCAATACA------
241242243244245246247248249250251252253254255256257258259260261262263264
E F E D L I N N I E H L V T E S I K R F Y D L L
- F E D L I N N I E H L V T - - - - - - - - - -
---GTAAGCTACAGGTGCAACTGTCTCCAAATAAAGTTGCGA------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G D E I K D L Y P E I K L Q N V P K R P F K R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R Y V D A I K F L N D E G V K K D D D T D F V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G D D I P D S R E K I I C E R F G K G E P V L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T H F L V E H K P F Y M K L D S S N E T C T E S
- - - - - - - - - - - - - - - - - - - - - - - S
---------------------------------------------------------------------TTT
361362363364365366367368369370371372373374375376377378379380381382383384
F D L L Y P G I G E I V G G S M R L D N Y N K L
F D L L Y - - - - E I V G G S M R - - - - - - -
CGATTTGTTCTCCTG------------AATAGTCAATGAAGTACATTTTGT---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D G F K R E G L N P E D Y D W Y L D M A R F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P C S H G G Y G L G F E R L L M A L M R Y T N I
- C S H G G Y G L G F E R L L M A - - - - - - -
---CCAGCCAAATGTTTTAATTCTTTTATGCATATCACTCTTAGAAATTTC---------------------
433434435436437438439440441442443444445446447
E F A T L Y P R N T R R C H P
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_asn_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I K P E K K F V T E Y S V T G R L R I A S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D G E D G G V S Y I G K K V T V G G W A R T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K Q C S D T L L F I S L N D G S T S S N L Q C V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E K T V K G F E E G L K A T A G C S F K I T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I V K S P A Q G Q S V E L L L N T G D D E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I C G L C D A S K Y P L A K K H H S K E F L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V A H L R P R S Q F F S S V M R I R N S L A I A
- - - - - - - - - - - - - - - - I R N S L A I A
------------------------------------------------ATCAGAAATTCTCTTGCTATTGCA
169170171172173174175176177178179180181182183184185186187188189190191192
I H E Y F Q K N G F M Y I H T P I I T A A D C E
I H E Y F Q K N G F M Y I H T P I I T - - - - -
ATTCATGAATATTTCCAAAAGAACGGTTTTATGTACATTCACACTCCAATTATTACT---------------
193194195196197198199200201202203204205206207208209210211212213214215216
G A G E M F Q V T T V L P P E S K N N I S N I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A S K I E G S Q D M A V D Y K K D F F G K A S Y
- - - - - - - - - - - - - - - - - - - - - - - Y
---------------------------------------------------------------------TAT
241242243244245246247248249250251252253254255256257258259260261262263264
L T V S G Q L A L E N F A C S M S D V Y T F G P
L T V S G Q L A L E - - - - - - S D V Y T F G P
TTGACTGTTTCTGGACAACTTGCTTTAGAG------------------TCTGATGTTTATACATTTGGACCA
265266267268269270271272273274275276277278279280281282283284285286287288
T F R A E N S H T T R H L A E F W M I E P E M A
T F R A - - - - - - - - - A E F W M I E P E M A
ACTTTCAGAGCG---------------------------GCTGAATTTTGGATGATCGAGCCTGAAATGGCA
289290291292293294295296297298299300301302303304305306307308309310311312
F A D L S D N M K L G E G L L K Y T V E Y V L I
- - - L S D N M K L G E G L L K - - - - - - - -
---------CTTAGTGATAACATGAAACTTGGAGAAGGACTTCTTAAA------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N N M P D L L Y L D K N I E N G L V E R L K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C K E E F A R I S Y T E A I E M L K P H D K E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T V P V S W G M D L G S E H E K Y I T D V L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R P C I I Y N Y P K D I K S F Y M K L N E D G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T V A A M D I L V P K I G E V I G G S Q R E D D
- - - A M D I L V - - - - E V I G G S Q R - - -
---------GCAATGGATATCCTAGTC------------GAGGTTATCGGTGGTTCTCAGAGA---------
433434435436437438439440441442443444445446447448449450451452453454455456
I E K L E N A I K S R N M D P A P Y W W Y N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R K Y G S V P H S G F G L G F E R L I M M V T G
- - - - - V P H S G F G L G F E R L I M M - - -
---------------GTTCCACATTCAGGGTTTGGTTTAGGATTTGAAAGACTAATCATGATG---------
481482483484485486487488489490491492493494495496497498499
V E N V R D V I P F P R Y P N H C E F
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_asn_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_asn_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
Q V G Q S L R I G G W V K T G R G A G G G E W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F L E V N D G S C F N S M Q V A E A V G G F T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L T P S G T S V L L E G Q L V K A P E N A K Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E L K V S K V V H V G A C D N S A G N Y A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K K M T M E F L R G L M H L R P R T N T I G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V A R I R N A L A V A T H D F F Q S H G F L Y V
- - - I R N A L A V A T H D F F Q S H G F L Y V
---------ATACGCAACGCGCTGGCGGTTGCGACGCACGATTTCTTCCAGTCACATGGCTTCCTGTACGTG
145146147148149150151152153154155156157158159160161162163164165166167168
H T P L I T C S D C E G A G E I N C G A Q V T T
H T P L I T - - - - - - - - - - - - - - - - - -
CACACGCCACTCATCACC------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L S K A E Q A D K E P K V T E E E V Q A L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N V S A Q G Q A V A A A K A A D K A L Q K A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A E V N K L Q K A K A A L A A K K E R A E L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R M V G G I E R L P D G R I D Y T G D F F A R P
- - - - G . E . . . . . . . . . . . . . . . . .
------------GGC---GAG---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S Y L T V S G Q M N A E Y Y A C A L S N V Y T F
. . . . . S G Q M N A E - - - - - - S N V Y T F
---------------TCCGGGCAGATGAATGCGGAG------------------TCCAACGTGTACACGTTC
289290291292293294295296297298299300301302303304305306307308309310311312
G P T F R R A L F F L L F C F C N S H T A R H L
G P T F R R - - - - - - - - - - - - - - - - - -
GGGCCCACCTTCAGGCGC------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A E F W M I E P E M A F A D L E D D M R C A E D
A E F W M I E P E M A - - - L E D D M R C A E D
GCGGAGTTCTGGATGATTGAGCCGGAAATGGCC---------CTGGAGGATGACATGCGTTGCGCTGAGGAC
337338339340341342343344345346347348349350351352353354355356357358359360
Y V Q H C C R H L L A T C M P D L E F I N K Q V
Y V Q - - - - - - - - - - - - - - - - - - - - -
TACGTGCAG---------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D S G A I A R L Q Q I A H T P F E R V T Y T R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I E I L E E V V K S K K K K F E F P V E W G I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A S E H E R Y L T E E V F K K P V I V Y N Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S A I K A F Y M R Q N D D G K T V A A M D V L V
- - - - - - - - - - - - - - - - - - A M D V L V
------------------------------------------------------GCCATGGACGTGCTGGTT
457458459460461462463464465466467468469470471472473474475476477478479480
P K V G E L I G G S Q R E D R L E V L E A R L K
- - - - E L I G G S Q R - - - - - - - - - - - -
------------GAGCTCATCGGGGGGTCCCAGAGG------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E A G M P L E P Y S G Y L D L R R Y G S V P H S
- - - - - - - - - - - - - - - - - - - - V P H S
------------------------------------------------------------GTGCCCCACTCC
505506507508509510511512513514515516517518519520521522523524525526527528
G F G L G F E R L I L L A T G M D N I R E V I P
G F G L G F E R L I L L - - - - - - - - - - - -
GGATTTGGCCTGGGCTTTGAGCGCCTGATCCTGCTC------------------------------------
529530531532533534535536537538
F P R W P G H A E Y
- - - - - - - - - -
------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_asp_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A I S L R S R I H V A E L L S K G E V G K E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T V A G W V D T V R A H G G I V F V V L R D R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G K I Q L V V K K N V S K D A W K T A K N L T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E S V I A A H G T L V E S K A A L G G R E L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E L V V Y S K A D P L P I D I K D H S K T I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A K R L D W R F L D L R N P R N L L I F L V E A
- - - - - - - - - - - - - - - - - - - - - V E A
---------------------------------------------------------------GTCGAGGCA
145146147148149150151152153154155156157158159160161162163164165166167168
E M A R A A R E W F Y E H G F V E I F T S K I V
E M A R A A R E W F Y E H G F V E I F T S K I V
GAGATGGCTAGAGCGGCCCGCGAGTGGTTCTATGAGCATGGGTTCGTAGAGATATTCACCTCAAAGATAGTA
169170171172173174175176177178179180181182183184185186187188189190191192
G A A T E G G A E V F S I V Y F D K P A F L A Q
- - - - - - - - - - - - - - - - - - - - F L A Q
------------------------------------------------------------TTCCTAGCACAA
193194195196197198199200201202203204205206207208209210211212213214215216
S P Q L Y K Q M G V I A G F E R V F E I G P A F
S P Q L Y K Q - - - - - - - E R V F E I G P A F
TCTCCACAGCTTTACAAGCAG---------------------GAACGCGTATTTGAGATAGGACCTGCATTC
217218219220221222223224225226227228229230231232233234235236237238239240
R A E P H H T T R H L T E Y T S V D L E M G F I
R A - - - - - - - - - T E Y T S V D L E M G - -
CGTGCA---------------------------ACAGAATATACAAGTGTTGACCTAGAGATGGGA------
241242243244245246247248249250251252253254255256257258259260261262263264
D S F E D V M D A V E G V V R A M I R R A I S V
- - F E D V M D A V E G V V R - - - - - - - - -
------TTTGAGGATGTTATGGATGCTGTTGAGGGAGTAGTTCGT---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y G N Q I R E Y F P D A V L E E P K D I P R I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R E A Y K L L E S A G V E V E W G D D L S S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G E R K L G E I I E R E Y G S P I V F V T E Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W R A R P F Y T M K K P D D P E W T L S F D L L
- - - - - - - - - - - - - - - - - - - S F D L L
---------------------------------------------------------AGCTTCGACCTACTC
361362363364365366367368369370371372373374375376377378379380381382383384
F R G L E I A T G G Q R E H R Y E V L V K Q I E
F - - - E I A T G G Q R - - - - - - - - - - - -
TTC---------GAGATAGCTACTGGTGGTCAGCGT------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E K G L N P K N F E W Y L N M F R Y G A P P H G
- - - - - - - - - - - - - - - - - - - - P P H G
------------------------------------------------------------CCACCGCATGGA
409410411412413414415416417418419420421422423424425426427428429430431432
G A G I G L E R V A M Q L L G L G N I R E A R L
G A G I G L E R V A M Q - - - - - - - - - - - -
GGTGCAGGTATAGGCCTTGAGAGAGTTGCTATGCAG------------------------------------
433434435436437438439440441442
L P R D P E R L T P
- - - - - - - - - -
------------------------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_asp_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P R V Y I G S L R E L N H N D N V E I Y G W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q D L K L L K N V S F L I M R D R T G T V Q V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F K N T P D I V N L L K E L P R E S V L K I S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K I N K K S V S K S G L E V S G E S V E V L N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E R P L P L P V I D P V Q A D L E T R L N N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F I D L R K R D V S S I F N A E S S I L W G I R
- - - - - - - - - - - - - - A E S S I L W G I R
------------------------------------------GCAGAGAGTTCCATTCTCTGGGGTATAAGG
145146147148149150151152153154155156157158159160161162163164165166167168
E F L H S Q G F I E V H T P K I V A A A T E G G
E F L H S Q G F I E V H T P K I V - - - - - - -
GAATTCCTACATTCACAGGGCTTCATAGAGGTCCACACCCCAAAAATAGTT---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A D L F P V K Y F E N D A Y L N Q S P Q L Y K E
- - - - - - - - - - - - - Y L N Q S P Q L Y K E
---------------------------------------TACCTTAATCAAAGCCCACAACTATACAAAGAA
193194195196197198199200201202203204205206207208209210211212213214215216
I L M S S G F E K V F E V G P A F R A E E H N T
- - - - - - - E K V F E V G P A F R A - - - - -
---------------------GAGAAGGTGTTCGAAGTTGGCCCGGCATTTAGGGCC---------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R H L N E F T S I D I E M S F A D H N D A M R
- - - - N E F T S I D I E M S - - - H N D A M R
------------AACGAATTCACATCTATTGATATAGAGATGAGC---------CATAACGACGCAATGCGT
241242243244245246247248249250251252253254255256257258259260261262263264
I L E N A V K S G I E N M I N E N G K D L Q E N
I L E N A V K - - - - - - - - - - - - - - - - -
ATTCTAGAAAACGCTGTCAAA---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I N I S I P E I P F P R I T Y K E C I K L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K E G L E F Q F G N D F S P E E L R I I G R N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K D F Y F I T E W P S S L R P F Y T M P N R D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P T I T N S F D L Q Y R E V E V T S G A Q R V H
- - - - - S F D L Q Y - - - E V T S G A Q R - -
---------------TCATTCGATCTGCAGTAC---------GAAGTTACTTCAGGCGCGCAAAGG------
361362363364365366367368369370371372373374375376377378379380381382383384
D P D L L L K R F N E K K L N I D S F K F Y I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A F K Y G M P P H A G W G L G L E R L T M I V L
- - - - - - P P H A G W G L G L E R L T M I - -
------------------CCCCCACATGCTGGCTGGGGGCTCGGCCTTGAAAGACTCACCATGATT------
409410411412413414415416417418419420421422423424425426427428
G L N N I R E T T L F P R D R T R I I P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_asp_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M K D Y Y I K N V T Q D L D G K E V T L A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V H N I R D L G G K K F L L L R D K T G I G Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V D K S S P S F Q E I S D I S Q E S V I M V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G V V K A D N R A P N G V E V H A K E I K I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K A K S P L P L D V S G K V K A D I D T R L K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R V L D L R R Q E M Q S I L K I Q N I T L K S F
- - - - - - - - - - - - - - - I Q N I T L K S F
---------------------------------------------ATACAAAATATTACTCTGAAATCGTTT
145146147148149150151152153154155156157158159160161162163164165166167168
R E T L Y K E G F V E V F T P K I I A S A T E G
R E T L Y K E G F V E V F T P K I I - - - - - -
AGAGAAACTTTATATAAAGAGGGTTTCGTGGAAGTATTTACACCGAAAATAATA------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G A Q L F S V I Y F G E T A F L A Q S P Q L Y K
- - - - - - - - - - - - - - F L A Q S P Q L Y K
------------------------------------------TTTTTAGCTCAAAGTCCACAGTTATACAAA
193194195196197198199200201202203204205206207208209210211212213214215216
E L L A G V V E K V F E I A P A W R A E D S D T
E - - - - - - E K V F E I A P A W R A - - - - -
GAG------------------GAAAAGGTGTTTGAGATTGCTCCTGCATGGAGAGCT---------------
217218219220221222223224225226227228229230231232233234235236237238239240
P Y H L A E F I S M D V E M A F G N Y E D T M K
- - - - A E F I S M D V E M A - - - Y E D T M K
------------GCAGAGTTCATAAGTATGGATGTAGAAATGGCA---------TATGAAGACACGATGAAA
241242243244245246247248249250251252253254255256257258259260261262263264
L L E K L I Y N I V N S V K S E A S D E L K I L
L L E K L I Y - - - - - - - - - - - - - - - - -
CTTCTAGAGAAACTAATTTAT---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S H N L P D V K I P I K R L T Y K D A I E I L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S K G Y N I K F G D D I G T P E S R V L Y N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K E D L Y F I T D W P T L S R P F Y T K S K D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D P N V S E S F D L I Y R W L E I A S G S T R N
- - - - - - S F D L I Y - - - E I A S G S T R -
------------------AGTTTTGATTTAATATAC---------GAGATAGCTTCAGGTAGCACCAGA---
361362363364365366367368369370371372373374375376377378379380381382383384
H K R E V L E D S L R K R G L K P E N F E F F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R W F D Y G M P P H T G F G M G F A R L L V M L
- - - - - - - P P H T G F G M G F A R L L V M -
---------------------CCTCCCCACACAGGATTTGGAATGGGTTTTGCTAGACTTTTAGTGATG---
409410411412413414415416417418419420421422423424425426427428429
T G I H N V K E I V P F P R D K K R L V P
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_asp_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K D A Y T A D V T P E R D G E E V R L A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V H E V R D L G G I K F V L L R D R T G I V Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T L P K Q K V P K E T F E K V P K L T K E S V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R V E G T V Q A N E K A P G G V E V I P Q R I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V L S E S D T H L P L D P T G K V D A D L D T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D A R V L D L R R E E P Q A I F K I R N V V T
- - - - - - - - - - - - - - - - - - I R N V V T
------------------------------------------------------CTCGGACAGCAGGTCTAG
145146147148149150151152153154155156157158159160161162163164165166167168
T A I R E F L E E R G F I E V H T P K I I A S A
T A I R E F L E E R G F I E V H T P K I I - - -
GGTCTCCTCGTACGTTATACGCTCGAACGGTGTCTCCAGCTCCGGTAGCTCCCGATCCAATGC---------
169170171172173174175176177178179180181182183184185186187188189190191192
T E G G T E L F P V V Y F E R D A Y L A Q S P Q
- - - - - - - - - - - - - - - - - Y L A Q S P Q
---------------------------------------------------GAGTACCCGCATCACGTCCTC
193194195196197198199200201202203204205206207208209210211212213214215216
L Y K Q M L M A A G F E R V Y E I G P I F R A E
L Y K Q - - - - - - - E R V Y E I G P I F R A -
CTCGCTCTCTAT---------------------GGAGATGGCCTCGTTGAGGTGTCGCCGCGTGTTGTG---
217218219220221222223224225226227228229230231232233234235236237238239240
E H N T R R H L N E A I S V D I E M S F I E S E
- - - - - - - - N E A I S V D I E M S - - - - E
------------------------CTCGTAAACGCGCTCGAAGCCCGCGGCCATGAG------------AAG
241242243244245246247248249250251252253254255256257258259260261262263264
E D V M R V L E E L L A H V F R K V R E E C E K
E D V M R V L E E L L A - - - - - - - - - - - -
CTGTGGGCTCTGCGCCAGGTACGCATCCCTCTCGAA------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L E A L D R E L P E L E T P F E R I T Y E E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L D L L S E H G I E V E W G E D L P T E A E R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L G E I F E E P F F I T E W P R E T R P F Y T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A K D D E V T T A F D L M Y Q G L E L A S G A Q
- - - - - - - - A F D L M Y - - - E L A S G A Q
------------------------GACGCCTCCCGGAGCCTT---------CTGGACCGTACCCTCGACACG
361362363364365366367368369370371372373374375376377378379380381382383384
R E H R Y D V L V R Q I E E Q G L S P E D F R H
R - - - - - - - - - - - - - - - - - - - - - - -
GAT---------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y L E A F K Y G M P P H G G W G L G L E R T L M
- - - - - - - - - P P H G G W G L G L E R T L M
---------------------------CAGGAGGACGAACTTGATCCCTCCTAGGTCCCTTACCTCGTGCAC
409410411412413414415416417418419420421422423424425426427428429430431
T I T G A E N I R E V T L F P R D R K R L H P
T - - - - - - - - - - - - - - - - - - - - - -
CCA------------------------------------------------------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_asp_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V P I N T I T P D T P S A E V I G W A H E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R D L G G L A F L L I R D R T G I I Q V T V P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K K V A P E I A E T I R A I S R E S V V R V T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T V K P E G K A P G G R E L I P D A I E I V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S A T P L P L D V A E K V P A E L D T R L D N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F L D A R R P R V S A I F K I R N A V Q H A T R
- - - - - - - - - - - - - - I R N A V Q H A T R
------------------------------------------ATCCGAAACGCTGTTCAGCATGCAACACGG
145146147148149150151152153154155156157158159160161162163164165166167168
N F F F E N G F I E I N T S K I V A A A T E G G
N F F F E N G F I E I N T S K I V - - - - - - -
AACTTTTTCTTTGAAAACGGGTTTATCGAGATTAATACCTCAAAGATCGTC---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T E L F P I A Y F E K E A F L N Q S P Q L Y K Q
- - - - - - - - - - - - - F L N Q S P Q L Y K Q
---------------------------------------TTCCTGAATCAGAGCCCGCAGCTCTACAAGCAG
193194195196197198199200201202203204205206207208209210211212213214215216
M M M A A G F E K V Y E I G P I F R A E E H N T
- - - - - - - E K V Y E I G P I F R A - - - - -
---------------------GAGAAGGTCTATGAGATCGGTCCGATCTTCCGTGCT---------------
217218219220221222223224225226227228229230231232233234235236237238239240
T K H L N E A T S I D I E V S F T D H L G V M Q
- - - - N E A T S I D I E V S - - - H L G V M Q
------------AATGAGGCGACATCCATCGATATTGAAGTCTCA---------CATCTCGGGGTCATGCAG
241242243244245246247248249250251252253254255256257258259260261262263264
T L E D L I R D I Y Q F V D K T C S D A I A D L
T L E D L I R - - - - - - - - - - - - - - - - -
ACGCTCGAAGATCTGATAAGG---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G L D D F A V P E K G F P R L P Y S E A I E I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S A T C E E D I A Y G D D I G T A A E R A I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E M G R L Y F I V D W P S S I R P Y Y A M P Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N D P E I C K A F D M M H P R M E L S S G A Q R
- - - - - - - A F D M M H - - - E L S S G A Q R
---------------------GCCTTTGATATGATGCAC---------GAACTCTCATCCGGTGCCCAGCGG
361362363364365366367368369370371372373374375376377378379380381382383384
V H Q H D L L V E Q I A K K G L N P E N F E F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N P F R F G M P P H A G W G L G A E R L V T T
- - - - - - - - P P H A G W G L G A E R L V T T
------------------------CCGCCCCATGCGGGCTGGGGACTTGGTGCCGAGCGTCTCGTAACGACC
409410411412413414415416417418419420421422423424425426427428429430
M L G L P N V R E A V L F P R D R H R V V P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/asp_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V Y T A D V K P E M E G Q K V T L Y G W V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V R D L G G L V F I L L R D R E G I V Q I T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P R K F V S K Q V F K L A K K I R R E S V I A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G E V R R E E K A P G G V E I I P E S I E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N E A D A P L P L E V T E K V P A E L D T R L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
H R F M D L R R P R V Q A I F R I R H Q V M Q S
- - - - - - - - - - - - - - - - I R H Q V M Q S
------------------------------------------------ATAAGGCATCAGGTGATGCAGAGC
145146147148149150151152153154155156157158159160161162163164165166167168
V R E F L S E E G F I E V H T P K I V S T A T E
V R E F L S E E G F I E V H T P K I V - - - - -
GTGAGAGAATTTCTGTCAGAGGAGGGTTTCATTGAAGTGCACACACCAAAGATTGTT---------------
169170171172173174175176177178179180181182183184185186187188189190191192
G G T E L F P I S Y F E K E A F L N Q S P Q L Y
- - - - - - - - - - - - - - - F L N Q S P Q L Y
---------------------------------------------TTCCTCAACCAGAGCCCCCAGCTATAC
193194195196197198199200201202203204205206207208209210211212213214215216
K Q V L M A A G F E K V F E I G P I F R A E E H
K Q - - - - - - - E K V F E I G P I F R A - - -
AAGCAG---------------------GAGAAGGTCTTTGAAATTGGCCCGATTTTCAGGGCC---------
217218219220221222223224225226227228229230231232233234235236237238239240
N T T R H L N E A I S I D I E M S F T D H N G V
- - - - - - N E A I S I D I E M S - - - H N G V
------------------AATGAAGCAATCTCCATCGACATTGAGATGAGC---------CACAACGGAGTC
241242243244245246247248249250251252253254255256257258259260261262263264
M D V L E R L V Q R V Y E D V A E K C E R Y L G
M D V L E R L V Q - - - - - - - - - - - - - - -
ATGGACGTCCTTGAAAGGCTCGTTCAG---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W L E V S L E I P E L P F P R I T Y D E A R E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A A R K G E E I P W G E D L S T N A L K L V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E M G G L Y F I T D W P T E S K P F Y A M P Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D R P E I S K S F D L M H G W L E L S S G A Q R
- - - - - - - S F D L M H - - - E L S S G A Q R
---------------------AGCTTCGACTTAATGCAC---------GAGCTTTCGAGCGGAGCCCAGAGA
361362363364365366367368369370371372373374375376377378379380381382383384
I H L Y D M L V E S I K A K G M E P E S F G F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E A F R Y G M P P H A G W G L G A E R L I M S
- - - - - - - - P P H A G W G L G A E R L I M S
------------------------CCGCCCCATGCAGGCTGGGGACTTGGAGCTGAGAGGCTCATCATGTCC
409410411412413414415416417418419420421422423424425426427428429430
M L G L K N V R E A V L F P R D R H R L V P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_asp_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L L G D L R R T H Y S K D I E P E M D G D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T V M G W V H E I R D L G G I I F V L L R D R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G L I Q I T A P S K K I E K D L F K S I R K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K E S V V A F G G T V Q E S G K A P G G F E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P S F L K V L N I S K Q P L P L D P T E K V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E I D T R L D A R F L D L R K P S V S A I F K I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------ATA
145146147148149150151152153154155156157158159160161162163164165166167168
K S R M L H S V R V F L E E Q G F L E I N T P K
K S R M L H S V R V F L E E Q G F L E I N T P K
AAAAGCAGAATGCTGCATTCAGTCAGGGTATTCCTTGAAGAACAGGGATTCCTCGAGATAAACACCCCAAAG
169170171172173174175176177178179180181182183184185186187188189190191192
L V A S A T E G G T E L F P I T Y F E R E A F L
L V - - - - - - - - - - - - - - - - - - - - F L
TTAGTT------------------------------------------------------------TTCCTC
193194195196197198199200201202203204205206207208209210211212213214215216
G Q S P Q L Y K Q I M M S T G L D R V Y E I A P
G Q S P Q L Y K Q - - - - - - - D R V Y E I A P
GGCCAGAGCCCACAGCTGTACAAGCAG---------------------GACCGTGTGTACGAAATCGCCCCA
217218219220221222223224225226227228229230231232233234235236237238239240
I F R A E E H D T L R H L N E V I S I D I E A S
I F R A - - - - - - - - - N E V I S I D I E A S
ATATTCAGGGCA---------------------------AACGAGGTCATATCAATCGACATCGAGGCATCC
241242243244245246247248249250251252253254255256257258259260261262263264
F V D H E D V M K I L E N L V V R V I E D V N E
- - - H E D V M K I L E N L V V - - - - - - - -
---------CACGAGGACGTGATGAAGATACTTGAAAACCTCGTGGTG------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H C T D A L E T L G R T L E V P E T P F E R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y D E A V E M V N S K G V P M K H G E D L P R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A E K A L G E I M D G Y Y F I T S W P T A I K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F Y V M P D E D D P E R S H A F D L M Y R D L E
- - - - - - - - - - - - - - A F D L M Y - - - E
------------------------------------------GCATTTGACCTCATGTAC---------GAG
361362363364365366367368369370371372373374375376377378379380381382383384
I S S G A M R V H Q H D L L V E K I K R Q G L N
I S S G A M R - - - - - - - - - - - - - - - - -
ATATCCTCAGGGGCCATGAGG---------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P D S F E S Y L S A F E Y G M P P H A G W G L G
- - - - - - - - - - - - - - - P P H A G W G L G
---------------------------------------------CCACCCCACGCAGGATGGGGACTCGGT
409410411412413414415416417418419420421422423424425426427428429430431432
A E R F N M T L T G L K N I R E T V L F P R D R
A E R F N M T - - - - - - - - - - - - - - - - -
GCTGAGAGGTTCAACATGACC---------------------------------------------------
433434435436437
R R L T P
- - - - -
---------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_asp_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y P K K T H W T A E I T P N L H G T E V V V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G W V W E L R D I G R V K F V V V R D R E G F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q V T L K A G K T P D H L F K V F A E L S R E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V V I K G I V E A S K I A K S G V E I F P S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I W I L N K A K P L P I D I W S E T P D L A T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L K W R S V D L K R P R N L V V F T V A S A M L
- - - - - - - - - - - - - - - - - - V A S A M L
------------------------------------------------------TTGTCTAAGTCTGTCCAC
145146147148149150151152153154155156157158159160161162163164165166167168
R S I R E V L Y G E G F V E V F T P K I I V T S
R S I R E V L Y G E G F V E V F T P K I I - - -
CGCCTCGTCGTAATCAACTCTGGGAATATTGGACAACTCCATCAGCGCTTTAATACCCACTTC---------
169170171172173174175176177178179180181182183184185186187188189190191192
T E G G A E L F P V M Y F E R V A Y L S Q S P Q
- - - - - - - - - - - - - - - - - Y L S Q S P Q
---------------------------------------------------GATGTCCATTATATCGTTGTA
193194195196197198199200201202203204205206207208209210211212213214215216
L Y K E Q L T A S L E R V F E I G P A Y R A E K
L Y K E - - - - - - E R V F E I G P A Y R A - -
ATCCATAAATGC------------------AATGAATTCGTTGAGGTGATAGTCAGTGTTGTGTTT------
217218219220221222223224225226227228229230231232233234235236237238239240
H N T D Y H L N E F I S V D A E A A F M D Y N D
- - - - - - - N E F I S V D A E A A - - - Y N D
---------------------AAAAACCCTCTCCAGCGAGGCTGTGAGCTGCTC---------CTGCGGACT
241242243244245246247248249250251252253254255256257258259260261262263264
I M D I L E K I M R R L A S T V S E Y A P K L E
I M D I L E K I M R - - - - - - - - - - - - - -
TTGGGAAAGGTAAGCTACTCTTTCGAAGTA------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V G I K A L M E L S N I P R V D Y D E A V D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R Q L G Y A V N W G D D F T V E M Q K A L M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y Y G P V Y F I V N F P A S L R P F Y T K R K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G E K S E S Y D L I I N G I E V A S G A T R I H
- - - - - S Y D L I I - - - E V A S G A T R - -
---------------ACTTTTGGCAATTTTACT---------AATGCCTTTAATTACCACGACGTC------
361362363364365366367368369370371372373374375376377378379380381382383384
K R D E L E E E M K K R G L D P R L F E S H L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V F D Y G M P P H A G F G L G F N R L V T A L L
- - - - - - P P H A G F G L G F N R L V T A - -
------------------CACGAACTTCACTCTCCCAATGTCTCTCAACTCCCATACCCAACCGGC------
409410411412413414415416417418419420421422423424425426427428
G L D N V R H A T L Y P R D R Y R V E P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_asp_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P R T Y I D T L R D H E D G A K V V V Y G W M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q E A R I M K N I S F L M I R D N T G T I Q A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F K N D E A T L D I I K R I N R E S I V R V D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V N K K S I S K A G I E I S G T S I S I V N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E A P L P L P V V D P V Q A D L E T R L N S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F M D L R K R N I S A I F R I E S A L L W G I R
- - - - - - - - - - - - - - I E S A L L W G I R
------------------------------------------ATAGAAAGCGCACTTCTATGGGGCATAAGG
145146147148149150151152153154155156157158159160161162163164165166167168
Q Y L H S Q K F I E V H T P K I V A A A T E G G
Q Y L H S Q K F I E V H T P K I V - - - - - - -
CAGTATCTCCATAGCCAAAAGTTCATAGAGGTGCATACTCCGAAGATAGTG---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S D L F P V R Y F E K D A Y L N Q S P Q L Y K E
- - - - - - - - - - - - - Y L N Q S P Q L Y K E
---------------------------------------TACCTCAACCAGAGCCCACAGCTCTATAAAGAG
193194195196197198199200201202203204205206207208209210211212213214215216
V L M S A G F D R V F E V G P A F R A E E H N T
- - - - - - - D R V F E V G P A F R A - - - - -
---------------------GACCGAGTATTTGAAGTTGGCCCGGCATTTCGCGCC---------------
217218219220221222223224225226227228229230231232233234235236237238239240
T R H L N E F T S I D I E M S F A D H N D A M A
- - - - N E F T S I D I E M S - - - H N D A M A
------------AATGAATTCACCTCCATAGATATAGAGATGAGC---------CATAATGATGCTATGGCT
241242243244245246247248249250251252253254255256257258259260261262263264
M L E N A I R S G I E N A V R E N A E D F E S L
M L E N - - - - - - - - - - - - - - - - - - - -
ATGCTGGAGAAT------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I S I S V P E T P F P R I T Y E Q C I D L L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D G I D F T F G D D F S P D Q L R T I G S R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S G F Y F I T E W P S S V R P F Y T M P K S E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P R L T N S F D L Q Y R E I E V T S G A Q R V H
- - - - - S F D L Q Y - - - E V T S G A Q R - -
---------------TCATTCGATCTGCAATAT---------GAAGTTACCTCAGGGGCACAGAGG------
361362363364365366367368369370371372373374375376377378379380381382383384
D P K M L I Q R F N E K K L D V K S F Q F Y V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A F K Y G M P P H A G W G L G L E R L T M I L L
- - - - - - P P H A G W G L G L E R L T M I - -
------------------CCCCCACATGCTGGTTGGGGGCTTGGCCTTGAACGCCTAACCATGATT------
409410411412413414415416417418419420421422423424425426427428
G L N N I R E T T L F P R D R T R I V P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_asp_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L Y L M Q I K G W V H K V R D L G K I K F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I R D G Y K I M Q A V I K K G E S P D Y L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L D I P I E S A V E I E G E E R E T N G K K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V K D L K I L A K A E P L P I D P K K A T P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K R F D Y R I I D L K L P E R Q T L F R L R A K
- - - - - - - - - - - - - - - - - - - - L R A K
------------------------------------------------------------TTAAGGGCCAAA
121122123124125126127128129130131132133134135136137138139140141142143144
V Q K F F R D W F M E N G F V E I N T P K I V I
V Q K F F R D W F M E N G F V E I N T P K I V -
GTACAAAAATTCTTTAGAGATTGGTTTATGGAAAATGGTTTTGTCGAAATAAATACTCCTAAAATAGTT---
145146147148149150151152153154155156157158159160161162163164165166167168
I G A E S G A E V F P V L Y F G K E A Y L T Q S
- - - - - - - - - - - - - - - - - - - Y L T Q S
---------------------------------------------------------TATTTAACACAATCT
169170171172173174175176177178179180181182183184185186187188189190191192
P Q L Y K Q M M V S V F P K V F E I A F A Y R A
P Q L Y K Q - - - - - - P K V F E I A F A Y R A
CCCCAATTGTATAAACAA------------------CCAAAGGTATTCGAAATTGCTTTCGCTTATAGGGCA
193194195196197198199200201202203204205206207208209210211212213214215216
E P S R T S R H L A E F T S V D A E M G F I K D
- - - - - - - - - A E F T S V D A E M G - - - -
---------------------------GCAGAATTCACTTCTGTAGATGCTGAAATGGGA------------
217218219220221222223224225226227228229230231232233234235236237238239240
E Y D V I N T I K K M L I D V S E K A M Q T K E
E Y D V I N T I K K M L I - - - - - - - - - - -
GAATATGATGTTATTAATACAATAAAGAAAATGTTAATC---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F E E L A K P I D L G F E I I T F D E A K E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G N P N E D L T T E E E R K L G E H F M E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V S F V A V T K Y P W S E R P F Y T M R L D D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P S Y T R G F D I I F R G L E I I S G A Q R E H
- - - - - G F D I I F - - - E I I S G A Q R - -
---------------GGTTTTGATATTATATTT---------GAAATAATAAGTGGGGCACAAAGA------
337338339340341342343344345346347348349350351352353354355356357358359360
R Y E K L L E N I K E K G I D P N K L E Y Y L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F K Y G M P P H G G F G L G L E R Y L R Q L L
- - - - - - P P H G G F G L G L E R Y L R Q - -
------------------CCCCCTCATGGGGGATTTGGATTGGGATTAGAGAGGTATTTAAGACAA------
385386387388389390391392393394395396397398399400401402403404
G L D D V R E V I L F Y R D I D R L L P
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_asp_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y A L G D W R R T H Y S S E V N S E M D G Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I I I M G W N H S I R K L G K L V F I I L R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E G T I Q I V A P K Q K V S E E T F A T A K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G K E D V M A I K G K V V A N E K A P A G F E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I P I E I K I L N K A D T P L P L D P S E K V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A D I D T R L D K R F L D L R R P K I Q S L F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L R S E V L K S I R N T F H D N G F I D V D T P
L R S E V L K S I R N T F H D N G F I D V D T P
TTAAGGTCTGAGGTATTAAAATCTATTAGAAATACTTTTCATGACAACGGATTTATTGATGTAGATACCCCA
169170171172173174175176177178179180181182183184185186187188189190191192
K L V A S A T E G G T E L F P I S Y F D K E A F
K L V - - - - - - - - - - - - - - - - - - - - F
AAACTTGTA------------------------------------------------------------TTT
193194195196197198199200201202203204205206207208209210211212213214215216
L G Q S P Q L Y K Q M M M A A G F D R V F E I G
L G Q S P Q L Y K Q - - - - - - - D R V F E I G
TTAGGACAAAGCCCACAGTTATATAAACAA---------------------GACAGAGTATTTGAAATTGGA
217218219220221222223224225226227228229230231232233234235236237238239240
P I F R A E E H N T R R H L N E A I S I D C E M
P I F R A - - - - - - - - - N E A I S I D C E M
CCAATATTTAGGGCA---------------------------AATGAGGCAATCTCAATTGACTGTGAAATG
241242243244245246247248249250251252253254255256257258259260261262263264
S F A D E K D A M E I L E K V I N N A F T D I Y
S - - - E K D A M E I L E K V I N - - - - - - -
TCA---------GAAAAAGATGCTATGGAAATACTTGAAAAGGTTATTAAT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N N N Q K E L Q T L G I D L K V Q E T P F P R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E Y T E A V D M V N A K G V E M E W G E D F S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P A E A A L G E M M D G F Y F I T D W P T E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P F Y T L P N E D N P K L C K A F D L M Y K D L
- - - - - - - - - - - - - - - A F D L M Y - - -
---------------------------------------------GCTTTTGACTTAATGTAT---------
361362363364365366367368369370371372373374375376377378379380381382383384
E I S S G A Q R N H K Y D L L V E G I K R M G L
E I S S G A Q R - - - - - - - - - - - - - - - -
GAAATATCCTCAGGAGCTCAAAGA------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N P E G F G T Y L E A F K Y G M P P H S G W G V
- - - - - - - - - - - - - - - - P P H S G W G V
------------------------------------------------CCCCCACACTCTGGTTGGGGAGTA
409410411412413414415416417418419420421422423424425426427428429430431432
G I E R L M M I M A C Q Q N I R E C V L F P R D
G I E R L M M I - - - - - - - - - - - - - - - -
GGTATTGAAAGACTTATGATGATT------------------------------------------------
433434435436437438
R Q R L T P
- - - - - -
------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_asp_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L A N L R T H Y T A E V K P E S V D N G Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I T L A G W I H E V R D L G G I C F V V L R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E G K A Q V T L V K K K I D K E L F D A A R R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I R E S V I S V T G S V K F E E K A P N G Y E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P E E I K V L N V A G S P L P M D T T G K V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A E L D T R L D S R F I D L R R A E T T A V F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I R H E A L Q A I R E Y F V K N K F I E T A T P
I R H E A L Q A I R E Y F V K N K F I E T A T P
ACAACGGCTGTTTACTATCTCGATTACCTCGTCATATGTAAGTTTCAGGAAAGGAGTCTTCGGAACTTTCAA
169170171172173174175176177178179180181182183184185186187188189190191192
K V V A T A T E G G T A L F P I T Y F D R E A F
K V V - - - - - - - - - - - - - - - - - - - - F
CTCAACCCC------------------------------------------------------------GTT
193194195196197198199200201202203204205206207208209210211212213214215216
L N Q S P Q L F K Q I L M G G G F D R V F E I G
L N Q S P Q L F K Q - - - - - - - D R V F E I G
TTCCAGAATTTCCATTACATCAAAGTGGTC---------------------GATAGAAGTGGCTTCGTTTAA
217218219220221222223224225226227228229230231232233234235236237238239240
P I F R A E E H D T R R H L N E A T S I D V E V
P I F R A - - - - - - - - - N E A T S I D V E V
GTGCCTGCGGGTATC---------------------------GATTTCAAAGACCCTGTCAAAACCGCCGCC
241242243244245246247248249250251252253254255256257258259260261262263264
S F A D H F D V M E I L E N L V A H I Y T R V I
S - - - H F D V M E I L E N L V A - - - - - - -
CAT---------TTTGAAGAGCTGGGGGCTCTGGTTAAGGAAAGCTTCCCT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E N C K A S L E I L G V E L K V P K T P F L K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T Y D E V I E I V N S R C E E K M H W G D D L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T L G E H T V G N Y V Y E T T G E S H Y F I I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W P T E I K P F Y A M P Y E D R P E F S K S F D
- - - - - - - - - - - - - - - - - - - - - S F D
---------------------------------------------------------------TTCTTCGAA
361362363364365366367368369370371372373374375376377378379380381382383384
M M H R T M E L S S G A Q R I H I S E L L K S R
M M H - - - E L S S G A Q R - - - - - - - - - -
CTTGACAGA---------GGAAATCACGGACTCGCGGATGAG------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I E S Q G L N P D G F E F Y L K A F E Y G M P P
- - - - - - - - - - - - - - - - - - - - - - P P
------------------------------------------------------------------CCCTCC
409410411412413414415416417418419420421422423424425426427428429430431432
H A G W G M G C E R F V M T M L G T E N I R D T
H A G W G M G C E R F V M T - - - - - - - - - -
GAGGTCTCTGACCTCATGGATCCAGCCTGCAAGGGTAATTTT------------------------------
433434435436437438439440441442443444
V L F P R D R R R L S P
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_asp_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R T H Y S N E I T E E L N G K R V K V A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V Q E V K D L G G I K F I W I R D R E G I V Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T A P K K K V S Q E I F K L I P K L N S E D V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V E G I V N F T P K A K L G F E V I P E K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V I S R A K T P L P L D P T G K V K A E L D T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D N R F M D L R N P K V M A I F K I R S S V F
- - - - - - - - - - - - - - - - - - I R S S V F
------------------------------------------------------CCAGGGAATTTCTTTTCC
145146147148149150151152153154155156157158159160161162163164165166167168
R A V R E F F Y S E G F I E I H T P K I I A T A
R A V R E F F Y S E G F I E I H T P K I I - - -
TAAATCGCTGAGGATCTCCAGGGCTTTGTCATAAGTTATCCTGGGGAAGGGTCTTTTAGGCTC---------
169170171172173174175176177178179180181182183184185186187188189190191192
T E G G T E L F P L K Y F E R D A F L A Q S P Q
- - - - - - - - - - - - - - - - - F L A Q S P Q
---------------------------------------------------GACGTATGAGATCAACCTCTC
193194195196197198199200201202203204205206207208209210211212213214215216
L Y K Q M M M A T G L D K V F E I A P I F R A E
L Y K Q - - - - - - - D K V F E I A P I F R A -
AAGGAGATCCAT---------------------AAATGCCATCTCGGCATCTATGCTCCACGCTTCGTT---
217218219220221222223224225226227228229230231232233234235236237238239240
E H N T T R H L N E A W S I D A E M A F I E N E
- - - - - - - - N E A W S I D A E M A - - - - E
------------------------GGCCCTAAATATTGGAGCTATCTCAAAGACCTT------------GGC
241242243244245246247248249250251252253254255256257258259260261262263264
G E V M D L L E R L I S Y V I N Y V R E H N E K
G E V M D L L E R L I S - - - - - - - - - - - -
CATCATCATCTGCTTGTAAAGCTGGGGAGATTGGGC------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L K T L E F E L N E P K R P F P R I T Y D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E I L S D L G K E I P W G E D I D T E G E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L G K Y M A E N E G A D L Y F I Y R Y P S E A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P F Y I M K Y D E K P E V C R A F D L E Y R G V
- - - - - - - - - - - - - - - A F D L E Y - - -
---------------------------------------------AAATCCAAGCTTTGCTTT---------
361362363364365366367368369370371372373374375376377378379380381382383384
E I S S G G Q R E H R H D V L L E Q I K E K G L
E I S S G G Q R - - - - - - - - - - - - - - - -
GTTTACAATACCCTCAACGACTAT------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N P K S F E F Y L K A F E Y G M P P H G G F G L
- - - - - - - - - - - - - - - - P P H G G F G L
------------------------------------------------AATCCAGATGAACTTTATACCTCC
409410411412413414415416417418419420421422423424425426427428429430431432
G A E R L I M R M L D I G N I R E V I L F P R D
G A E R L I M R - - - - - - - - - - - - - - - -
TAAATCCTTAACCTCCTGCACCCA------------------------------------------------
433434435436437438
R R R L V P
- - - - - -
------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_asp_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D Q H G H T L G R D L H G P R T H T C G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R R A H V G Q E V V L K G W V D T R R D L G G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I F I D L R D R Y G L T Q I V F S P Q D N E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y R L A D R L R S E Y V I S V R G V V R E R S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E T V N P R L A T G E V E V R A H D L I I L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S E P L P F P V S A H E E K R T T T S E E L R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K Y R Y L D L R R P E L Q R N L L L R H Q V Y L
- - - - - - - - - - - - - - - - - L R H Q V Y L
---------------------------------------------------CTGCGCCACCAGGTCTATCTG
169170171172173174175176177178179180181182183184185186187188189190191192
I T R R Y F D A H Q F V E V E T P V L T K S T P
I T R R Y F D A H Q F V E V E T P V L T - - - -
ATCACCCGACGCTACTTCGACGCGCATCAGTTCGTCGAAGTCGAAACGCCCGTGCTGACC------------
193194195196197198199200201202203204205206207208209210211212213214215216
E G A R D F L V P S R L H P G K F Y A L P Q S P
- - - - - - - - - - - - - - - - - - A L P Q S P
------------------------------------------------------GCGCTGCCCCAGTCGCCG
217218219220221222223224225226227228229230231232233234235236237238239240
Q L Y K Q I L M V A G L D R Y F Q I V K C F R D
Q L Y K Q - - - - - - - D R Y F Q I V K C F R D
CAGCTCTACAAACAG---------------------GATCGCTACTTCCAGATCGTCAAGTGCTTCCGCGAC
241242243244245246247248249250251252253254255256257258259260261262263264
E D L R A D R Q P E F T Q I D V E M T F P T E E
- - - - - - - - P E F T Q I D V E M T - - - E E
------------------------CCGGAATTCACCCAGATCGATGTGGAGATGACC---------GAGGAG
265266267268269270271272273274275276277278279280281282283284285286287288
Q I F E L I E G L I Q A I W R E T L G V E L P R
Q I F E L I E G L I Q - - - - - - - - - - - - -
CAGATTTTTGAACTCATCGAAGGGCTTATCCAG---------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P F P R M S Y D E A L R R F G S D K P D T R F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L E L Q E I G E V F R G S G F R V F E S V L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G G E I V A L V V P G M G D Q G R G Y M D R L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K D V V R K Q I G A G G L V Y F K L P S D G G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I Y S S V K E H V L P S A Y V Q R A V A K L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R A G D L V L L L A G P R P Q V Y L Q A G A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L H M A R E L N L I P P A G Q A P W H F L W V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D F P L L E W D E E A G R Y F A M H H P F T S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
H P D D L D L L E T D P G R V R A R A Y D L V L
- - - - - - - - - - - - - - - - - - A Y D L V L
------------------------------------------------------GCCTACGACCTGGTGCTG
505506507508509510511512513514515516517518519520521522523524525526527528
N G N E I G G G S I R I H R Q D I Q R R M F R V
- - - E I G G G S I R - - - - - - - - - - - - -
---------GAGATCGGCGGCGGCTCGATCCGT---------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L G I D Q E E A E R R F G F L L T A F R Y G A P
- - - - - - - - - - - - - - - - - - - - - - - P
---------------------------------------------------------------------CCG
553554555556557558559560561562563564565566567568569570571572573574575576
P H G G I A L G L D R I V M L L A G A G S L R D
P H G G I A L G L D R I V M L - - - - - - - - -
CCACACGGCGGCATCGCGCTGGGCCTGGACCGCATCGTGATGCTG---------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V I A F P K T Q R G Q E L M S N A P D E V S P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619
Q L E E L H I R V V L P E T E A S G S
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_asp_aa
Archaea/Staphylothermus marinus/Smarinus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I C G W I I R L K I V G K V V I I E V S G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T S V K P Y V L V L K K N R E P E L Y E E A K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L S V G T A L C F E G E K S P V Q K S K R G V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y I V K K L K I Y S K P L E P L P V D T V G K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P A L L D T R I K Y R Y L L V R N P V E K A I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R I R A G I I E A A R Q Y F N N N G F I E I H T
- I R A G I I E A A R Q Y F N N N G F I E I H T
---ATTAGAGCAGGAATTATTGAAGCAGCTAGACAATACTTTAACAATAATGGATTCATAGAGATACACACA
145146147148149150151152153154155156157158159160161162163164165166167168
P K I V A A G A E G G A T L F P V Q Y F E N K A
P K I V - - - - - - - - - - - - - - - - - - - -
CCTAAAATAGTA------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y L S Q S P Q L Y K Q M L I A G F P R V F E I T
Y L S Q S P Q L Y K Q - - - - - - P R V F E I T
TATCTTAGTCAGAGCCCACAATTATATAAACAA------------------CCAAGAGTATTTGAGATAACA
193194195196197198199200201202203204205206207208209210211212213214215216
P Y F R A E K F N T T R H L N E S W G I D A E Q
P Y F R A - - - - - - - - - N E S W G I D A E Q
CCTTATTTTAGGGCA---------------------------AATGAATCATGGGGTATTGATGCCGAGCAA
217218219220221222223224225226227228229230231232233234235236237238239240
G F I D S V E D V L N T L E D L I V Y I N N Y I
G - - - - V E D V L N T L E D L I V - - - - - -
GGA------------GTTGAAGATGTACTAAATACTCTTGAGGACCTCATAGTA------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R K N Y V E E Q E T L G I E I E K L D K P F K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L K F E E A I D L L R S E G L E V S E G E D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D A A E K K L G E I M E E K G Y K I Y F I I G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P W Q A T G F Y Y M R E E D G Y H T R K F D L D
- - - - - - - - - - - - - - - - - - - K F D L D
---------------------------------------------------------AAATTTGATCTAGAC
337338339340341342343344345346347348349350351352353354355356357358359360
Y K G L E I A S G G Q R E H R Y D K L V S A L K
Y - - - E I A S G G Q R - - - - - - - - - - - -
TAT---------GAAATAGCTAGTGGTGGTCAGAGA------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D K G L N P E D F A F Y L E A F K Y G M P P H G
- - - - - - - - - - - - - - - - - - - - P P H G
------------------------------------------------------------CCTCCGCATGGT
385386387388389390391392393394395396397398399400401402403404405406407408
G F G L G I E R L M M K M L G L E N I R E A I L
G F G L G I E R L M M K - - - - - - - - - - - -
GGTTTTGGATTGGGTATTGAGCGTTTAATGATGAAA------------------------------------
409410411412413414415416417418
F V R D R T R L V P
- - - - - - - - - -
------------------------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_asp_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V N K M K W R R T H Y S A D I K P E M D G Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V I I M G W V H S I R A L G K I I F V I L R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E G T V Q I V A P K Q K V G D E L F S Q I K K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G A E D V I A V K G K V I A N E K A P N G F E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P L E L E V I N T A K R P L P L D P A E K V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A E L D T R L E N R F L D L R R P K V Q A I F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I R S E M L K S V R N T L Y N E G F I E V N T P
I R S E M L K S V R N T L Y N E G F I E V N T P
ATTAGAAGTGAAATGCTAAAATCTGTAAGAAACACACTCTATAATGAGGGCTTTATTGAGGTAAATACACCA
169170171172173174175176177178179180181182183184185186187188189190191192
K L V A S C T E G G T E L F P I S Y F E R E A F
K L V - - - - - - - - - - - - - - - - - - - - F
AAATTGGTA------------------------------------------------------------TTT
193194195196197198199200201202203204205206207208209210211212213214215216
L G Q S P Q L Y K Q M L M A T G L D R V F E I A
L G Q S P Q L Y K Q - - - - - - - D R V F E I A
TTAGGGCAGAGTCCTCAGTTGTATAAGCAG---------------------GATAGAGTTTTTGAAATAGCT
217218219220221222223224225226227228229230231232233234235236237238239240
P I F R A E E H N T R R H L N E A T S I D I E M
P I F R A - - - - - - - - - N E A T S I D I E M
CCAATATTTAGGGCT---------------------------AATGAAGCTACATCAATAGACATTGAAATG
241242243244245246247248249250251252253254255256257258259260261262263264
A F A D D K D A M D I L E K V V Y N A F V D V Y
A - - - D K D A M D I L E K V V Y - - - - - - -
GCA---------GATAAGGATGCTATGGATATATTGGAGAAAGTTGTTTAT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E N R K K E I E T L G I E F E L P P E K F D R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T Y D E A I D I A N A K G V E I S W G E D L S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A E K A I G E E M E G L Y F I T D W P S E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P F Y T M P D E K N P N I C K A F D L M Y K D L
- - - - - - - - - - - - - - - A F D L M Y - - -
---------------------------------------------GCATTTGATTTAATGTAT---------
361362363364365366367368369370371372373374375376377378379380381382383384
E I S S G A Q R I H L Y D L L V E N I K K K G L
E I S S G A Q R - - - - - - - - - - - - - - - -
GAGATTTCTTCAGGAGCTCAAAGG------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N P D G F T Y Y L E A F K Y G M P P H A G W G L
- - - - - - - - - - - - - - - - P P H A G W G L
------------------------------------------------CCTCCACATGCAGGATGGGGATTA
409410411412413414415416417418419420421422423424425426427428429430431432
G A D R F T M V L T Q Q E N I R E C V L F P R D
G A D R F T M V - - - - - - - - - - - - - - - -
GGAGCGGATAGATTTACCATGGTA------------------------------------------------
433434435436437438
R Q R L T P
- - - - - -
------------------
Class II
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_asp_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L E R T Y I D D V S P D D D G S E T T I A G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V H E L R D L G G I L F V V V R D R T G L L Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V K E D D T P E V F E R A E A L S S E D I V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V R G T L E A T D Q A P G G V E L A P E E L T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V S E A S G D L S I E I S K D V D A D L S T R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D E R H L D V R K P E S R A V F S L R S K A M G
- - - - - - - - - - - - - - - - - L R S K A M G
---------------------------------------------------CTGCGCTCGAAAGCGATGGGC
145146147148149150151152153154155156157158159160161162163164165166167168
A M R S W F Y D N E F E E V D T P E L S T A G A
A M R S W F Y D N E F E E V D T P E L S - - - -
GCGATGCGGTCGTGGTTCTACGACAACGAGTTCGAGGAGGTCGACACGCCGGAACTGTCG------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G G A D L F P V V Y Y D Q E A Y L S Q S P Q L
- - - - - - - - - - - - - - - - Y L S Q S P Q L
------------------------------------------------TACCTCTCCCAGAGCCCGCAACTG
193194195196197198199200201202203204205206207208209210211212213214215216
Y K Q I L V A S G F D R L F E V G H A F R A E D
Y K Q - - - - - - - D R L F E V G H A F R A - -
TACAAGCAG---------------------GACCGCCTCTTCGAGGTCGGGCACGCGTTCCGCGCG------
217218219220221222223224225226227228229230231232233234235236237238239240
F G T S R H V S E I A M F D V E L G Y V E D H H
- - - - - - - S E I A M F D V E L G - - - - H H
---------------------TCCGAGATCGCGATGTTCGACGTCGAACTCGGC------------CACCAC
241242243244245246247248249250251252253254255256257258259260261262263264
D V M D V Q E E S L R H T I E A V V E R A G R E
D V M D V Q E E S L R - - - - - - - - - - - - -
GACGTGATGGACGTCCAGGAGGAGTCCCTGCGG---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L D V L D A D L A V P E E D F P R V T F E E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E I L R E E Y D H V P E D D T D L D T K G E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L G E Y F E E R G H P A V F V V G Y P D E K F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y M Q G V P G D D V A S R K F D L L Y R G Q E L
- - - - - - - - - - - - - K F D L L Y - - - E L
---------------------------------------AAGTTCGACCTGCTGTAC---------GAACTC
361362363364365366367368369370371372373374375376377378379380381382383384
S S G G Q R E H D V D R L R E T M T A Q G V D P
S S G G Q R - - - - - - - - - - - - - - - - - -
TCCTCGGGCGGCCAGCGT------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E N F E F Y L D A F R Y G V P P H G G Y G L G I
- - - - - - - - - - - - - - P P H G G Y G L G I
------------------------------------------CCGCCCCACGGGGGGTACGGCCTGGGTATC
409410411412413414415416417418419420421422423424425426427428429430431432
D R L I Q Q L A G V D N V K E A I L F P R D P D
D R L I Q Q - - - - - - - - - - - - - - - - - -
GACCGCCTCATCCAGCAG------------------------------------------------------
433434435436
R L E P
- - - -
------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_asp_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y R S H T C G E L R P A H A G Q E V T L A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V H R R R D H G D L I F I D L R D R Y G I T Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F N S A N A A A H A V A E T V R S E Y V L Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R G K V R I R P A E A V N P D I A T G E I E V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A F E A Q V L N P A R T P P I Y I A K E A G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E S V R L K Y R Y L D L R R E R M Q R N L I L R
- - - - - - - - - - - - - - - - - - - - - - L R
------------------------------------------------------------------TTACGC
145146147148149150151152153154155156157158159160161162163164165166167168
H R V V K F I R D F L D A E G F I E I E T P I L
H R V V K F I R D F L D A E G F I E I E T P I L
CATCGCGTGGTCAAGTTTATTCGCGACTTTCTCGATGCCGAGGGTTTTATCGAGATCGAAACACCGATTTTG
169170171172173174175176177178179180181182183184185186187188189190191192
I K S T P E G A R D Y L V P S R L H P G K F Y A
I - - - - - - - - - - - - - - - - - - - - - - A
ATC------------------------------------------------------------------GCC
193194195196197198199200201202203204205206207208209210211212213214215216
L P Q S P Q Q L K Q L L M V A G Y D K Y F Q I A
L P Q S P Q Q L K Q - - - - - - - D K Y F Q I A
TTGCCGCAAAGTCCACAGCAACTCAAGCAG---------------------GATAAATACTTTCAGATTGCC
217218219220221222223224225226227228229230231232233234235236237238239240
R C F R D E D Q R A D R Q P E F T Q L D M E M S
R C F R D - - - - - - - - P E F T Q L D M E M S
CGCTGTTTTCGTGAT------------------------CCCGAATTTACCCAACTTGATATGGAGATGAGC
241242243244245246247248249250251252253254255256257258259260261262263264
F V D Q E D V I N L I E R L F T E L C R T V T P
- - - Q E D V I N L I E R L F T - - - - - - - -
---------CAAGAGGATGTAATCAATCTGATCGAACGGCTCTTCACC------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H K R L L T P F R R L T Y A E A M E R Y G S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P D L R Y D L E L V N L S D V L A E T P F Q V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R S V L A V G G Q V K G I R V P G C G H F S R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q I D E L T E V A R S G G A K G L A W A V V P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D G G D V R S S F A K N L A P G E F D A L A Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M G A Q P G D L L L I V A D R P V V V A A S L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K L R R K L A D L L Q L A D P D T L C F A W V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D F P L V E W N E E E Q R W D A V H H P F T S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K D E D L H L L A T D P G K V R A K A Y D L I L
- - - - - - - - - - - - - - - - - - A Y D L I L
------------------------------------------------------GCTTACGATCTTATTCTC
481482483484485486487488489490491492493494495496497498499500501502503504
N G Y E A G G G S I R I H R R D V Q Q Q V F S L
- - - E A G G G S I R - - - - - - - - - - - - -
---------GAAGCCGGTGGTGGTAGTATTCGT---------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L G I G E E K A Q A Q F G H M L E A F E Y G A P
- - - - - - - - - - - - - - - - - - - - - - - P
---------------------------------------------------------------------CCG
529530531532533534535536537538539540541542543544545546547548549550551552
P H G G I A P G I D R L V M I L A D E P T I R E
P H G G I A P G I D R L V M I - - - - - - - - -
CCCCACGGTGGAATTGCGCCCGGCATCGATCGGTTGGTGATGATC---------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V M A F P K T Q Q A V D L M T N A P S P V D E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588
Q L K E L H I R I V E D
- - - - - - - - - - - -
------------------------------------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_asp_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R S H Y N T D L G I S H V G Q S V K L C G W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N S Y R D H G G V I F I D L R D R S G I I Q L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
C D P N D S K E A H E I A S N A R N E F V L I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E G T I R P R G E G L V N P K L K T G E I E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V S K L T I E N E S A V P P F A I A D E S V N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L R L K Y R F L D L R N P K L Y E N F A L R S
- - - - - - - - - - - - - - - - - - - - - L R S
---------------------------------------------------------------ATAACTTCC
145146147148149150151152153154155156157158159160161162163164165166167168
K A C I A A R N S L A N M G F L E V E T P I L T
K A C I A A R N S L A N M G F L E V E T P I L T
GTCATCATTTTGCTCAAACATAGGAAAATCAACAACCCATAAGAATTCCAAGGCATTTGGATCTATAAGTTT
169170171172173174175176177178179180181182183184185186187188189190191192
K A T P E G A R D Y L V P S R V H Q G E F Y A L
- - - - - - - - - - - - - - - - - - - - - - A L
------------------------------------------------------------------ACCGAA
193194195196197198199200201202203204205206207208209210211212213214215216
P Q S P Q L F K Q L L M C S G F D R Y F Q I A K
P Q S P Q L F K Q - - - - - - - D R Y F Q I A K
AAATACCACATCTCCTACTTCAAGCTC---------------------TAAATCTTCTTCGCTAAAGAATTT
217218219220221222223224225226227228229230231232233234235236237238239240
C F R D E D L R A D R Q P E F T Q I D V E M S F
C F R D - - - - - - - - P E F T Q I D V E M S -
ACAAAGTGGACC------------------------TATGAAAGCTAAGCCTTGGGCGCCAAATTTACG---
241242243244245246247248249250251252253254255256257258259260261262263264
C E Q K D V I K V A E T F L K D I F K A C G K E
- - Q K D V I K V A E T F L K - - - - - - - - -
------TTCAAATCTTTGCATTTGTCTTTTTGAAAAAATAGTATC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I Q T P F R Q M Q Y K D A M E N Y G S D K P D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F D L K F I D V I D I F T K S N N E I F A N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A K D T K K N R I K A I R V P K G D T I F S K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q M Q R F E E F V R K F G A Q G L A F I Q V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D G L K G P L C K F F S E E D L N E L S K R C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E V G D V V F F G A G A K K T V L D Y M G R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R I F L A N E L K L I D P N A L E F L W V V D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P M F E Q N D D G S Y S A M H H P F T M P K N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D E T D L E E I S S I A Y D V V L N G V E L G G
- - - - - - - - - - - A Y D V V L - - - E L G G
---------------------------------ACTTTCATCAGCGATAGC---------TACGGCACTTTC
481482483484485486487488489490491492493494495496497498499500501502503504
G S I R I H K N D I Q Q K V F K L L N I D E E Q
G S I R - - - - - - - - - - - - - - - - - - - -
ATTTTCTATGGT------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q K E K F G F L L D A L S F G A P P H G G I A I
- - - - - - - - - - - - - - - - P P H G G I A I
------------------------------------------------TGCATTGGAAGCGATTTCATGAGC
529530531532533534535536537538539540541542543544545546547548549550551552
G L D R L I M L V T G A N S I R E V I A F P K T
G L D R L I M L - - - - - - - - - - - - - - - -
TTCTTTACTATCATTTGGATCGCA------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q R A Q C L M T D A P S P A S N E A M R E L G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583
K L R E N I K
- - - - - - -
---------------------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_asp_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S M R T E Y C G L V T E H L L G Q T V S L C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V Q R R R D H G G V I F I D L R D R E G L V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V C D P D R A E M F A T A E G V R N E F C V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V K G L V R N R P E G T V N A G L K S G K I E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L C H E L T V L N A S V T P P F Q L D D D N L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E T T R L T H R V L D L R R P Q M Q H N L R L R
- - - - - - - - - - - - - - - - - - - - - - L R
------------------------------------------------------------------CTGCGC
145146147148149150151152153154155156157158159160161162163164165166167168
Y R V A I E A R K Y L D E Q G F I D I E T P M L
Y R V A I E A R K Y L D E Q G F I D I E T P M L
TACCGCGTCGCGATCGAGGCGCGCAAGTATCTCGACGAGCAGGGTTTCATCGACATCGAAACGCCGATGCTG
169170171172173174175176177178179180181182183184185186187188189190191192
T K S T P E G A R D Y L V P S R V N A G Q F F A
T - - - - - - - - - - - - - - - - - - - - - - A
ACG------------------------------------------------------------------GCG
193194195196197198199200201202203204205206207208209210211212213214215216
L P Q S P Q L F K Q L L M V A N F D R Y Y Q I T
L P Q S P Q L F K Q - - - - - - - D R Y Y Q I T
CTGCCGCAGTCGCCGCAGCTGTTCAAGCAG---------------------GACCGTTACTACCAGATCACG
217218219220221222223224225226227228229230231232233234235236237238239240
K C F R D E D L R A D R Q P E F T Q I D C E T S
K C F R D - - - - - - - - P E F T Q I D C E T S
AAGTGCTTCCGCGAC------------------------CCGGAATTCACGCAGATCGACTGCGAGACGTCG
241242243244245246247248249250251252253254255256257258259260261262263264
F L G E Q E I R D L F E D M I R H I F K T T I D
- - - E Q E I R D L F E D M I R - - - - - - - -
---------GAGCAGGAAATTCGCGATCTGTTCGAGGACATGATCCGT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V E L D A K F P V M P Y S E A M A R F G S D K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D L R V K L E F T E L T D A M K D V D F K V F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T P A N T K D G R V A A L R V P K G A E L T R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D I D G Y T E F V R I Y G A K G L A W I K V N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A K G R D G L Q S P I V K N L H D A S I A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E R T G A Q D G D I V F F A A D R A K V V N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S L G A L R L K I G H S E F G K A N G L V E S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W K P L W V V D F P M F E Y D D E E A R Y V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
H H P F T S P K D E H L E Y L E T D P G R C L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K A Y D M V L N G W E I G G G S V R I H R E E V
- A Y D M V L - - - E I G G G S V R - - - - - -
---GCGTACGACATGGTGCTG---------GAAATCGGCGGCGGCTCGGTGCGT------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q S K V F R A L K I G P E E A Q A K F G F L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A L Q Y G A P P H G G I A F G L D R I V T M M A
- - - - - - P P H G G I A F G L D R I V T M - -
------------------CCGCCGCACGGCGGCATCGCGTTCGGCCTCGATCGCATCGTCACGATG------
553554555556557558559560561562563564565566567568569570571572573574575576
G A D S I R D V I A F P K T Q R A Q C L L T Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
P S P V D E R Q L R E L H I R L R Q P E Q P K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_asp_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R T H Y C G E L R A E Q V G T S V T L Y G W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D R R R D H G G V I F V D L R D R T G T V Q I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S D P E R T P E S Y H Q A E G L R N E Y V V K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G R V S G R P A E S L N P K L P T G E V E I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A D R I E I L N A V R R Q L P F Q V S S A D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T V R E D L R L R Y R Y L D L R R D R M N R N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q L R H Q V V K A I R R F L E D E E Q F I E I E
- L R H Q V V K A I R R F L E . E E Q F I E I E
---CTGCGTCACCAAGTCGTCAAGGCGATTCGCCGCTTCTTGGAA---GAAGAACAATTTATCGAGATTGAA
169170171172173174175176177178179180181182183184185186187188189190191192
T P V L T K S T P E G A R D Y L V P S R V N P G
T P V L T - - - - - - - - - - - - - - - - - - -
ACACCCGTCCTGACC---------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E W F A L P Q S P Q L F K Q L L M V S G F D R Y
- - - A L P Q S P Q L F K Q - - - - - - - D R Y
---------GCCCTGCCGCAATCACCGCAGCTGTTTAAGCAA---------------------GATCGCTAC
217218219220221222223224225226227228229230231232233234235236237238239240
Y Q I A R C F R D E D L R A D R Q P E F T Q L D
Y Q I A R C F R D - - - - - - - - P E F T Q L D
TACCAAATTGCCCGCTGCTTCCGCGAT------------------------CCGGAATTTACCCAGCTCGAT
241242243244245246247248249250251252253254255256257258259260261262263264
M E M S F L S Q E E I I D L N E R L I A H I F K
M E M S - - - Q E E I I D L N E R L I A - - - -
ATGGAAATGAGC---------CAGGAAGAAATCATCGACCTGAACGAGCGGCTGATTGCT------------
265266267268269270271272273274275276277278279280281282283284285286287288
T V K G I E L P R P F P R L T Y A E A M D R Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D R P D T R F G L E L V D V S D V V A D M G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K V F S G A V K S G G K V K I L P I P D G N D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I S N V R I K P G G D I F K E A T E A G A A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A Y I R V R E N G E I D T I G A I K D N L S D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q K A E I L R R T Q A Q P G T L L L F G A G S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D I V N K S L D R V R Q F L G K E L G L I D P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A L N L L W V V D F P M V E W N A D E K R Y E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L H H P F T A P N P Q D L E D L T T A R A Q A Y
- - - - - - - - - - - - - - - - - - - - - - A Y
------------------------------------------------------------------GCCTAC
481482483484485486487488489490491492493494495496497498499500501502503504
D I V L N G L E I G G G S L R I Y Q R D I Q E R
D I V L - - - E I G G G S L R - - - - - - - - -
GACATCGTCCTC---------GAAATTGGCGGCGGTAGTCTGCGG---------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V F E T I G L S H E E A Q A K F G F L L E A F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
F G T P P H G G I A Y G L D R L V M L L T G E E
- - - P P H G G I A Y G L D R L V M L - - - - -
---------CCACCCCACGGCGGCATCGCCTACGGTCTCGATCGCCTTGTGATGTTG---------------
553554555556557558559560561562563564565566567568569570571572573574575576
S I R D A I A F P K T Q Q A R C L L T E A P A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599
V S D R Q L K E L Y V A S T W Q P P I K E R D
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_asp_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F R T H T C G E L R I S D V N K Q V K L S G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V Q R S R K M G G M T F V D L R D R Y G I T Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F N E E I D A E L C E R A N K L G R E F V I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I V G T V N E R F S K N S H I P T G D I E I I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E L N I L N S A I T P P F T I E D N T D G G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D I R M K Y R Y L D L R R S A V R S N L E L R H
- - - - - - - - - - - - - - - - - - - - - L R H
---------------------------------------------------------------TTACGTCAC
145146147148149150151152153154155156157158159160161162163164165166167168
K M T I E V R S Y L D K L G F L E V E T P V L I
K M T I E V R S Y L D K L G F L E V E T P V L I
AAAATGACGATCGAGGTTCGCAGTTATCTCGATAAACTGGGTTTCTTGGAAGTGGAAACTCCGGTATTGATC
169170171172173174175176177178179180181182183184185186187188189190191192
G S T P E G A R D F V V P S R M N P G Q F Y A L
- - - - - - - - - - - - - - - - - - - - - - A L
------------------------------------------------------------------GCATTA
193194195196197198199200201202203204205206207208209210211212213214215216
P Q S P Q T L K Q L L M V S G F D R Y F Q I A K
P Q S P Q T L K Q - - - - - - - D R Y F Q I A K
CCGCAATCTCCGCAGACACTGAAACAG---------------------GATCGTTATTTCCAGATAGCCAAA
217218219220221222223224225226227228229230231232233234235236237238239240
C F R D E D L R A D R Q P E F T Q I D C E M S F
C F R D - - - - - - - - P E F T Q I D C E M S -
TGTTTCCGTGAC------------------------CCTGAGTTCACTCAGATTGACTGCGAAATGAGT---
241242243244245246247248249250251252253254255256257258259260261262263264
V E Q E D V I T T F E G M A K H L F K V I R N I
- - Q E D V I T T F E G M A K - - - - - - - - -
------CAGGAAGATGTGATTACTACATTTGAAGGAATGGCCAAA---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L T E P F P R M P W S E A M R L Y G S D K P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R F G M Q F V E L M D I L K G H G F S V F D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A T Y I G G I C A E G A A G Y T R K Q L D A L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E F V K K P Q I G A K G M V Y A R I E A D G T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K S S V D K F Y T Q E V L Q Q L K E A F G A K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G D L I L I L S G D D A M K T R K Q L C E L R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E M G N Q L G L R D K N T F A C L W V V D F P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F E W S E E E G R L M A M H H P F T S P K P E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I H L L D T N P A A V R A N A Y D M V I N G V E
- - - - - - - - - - - - - - A Y D M V I - - - E
------------------------------------------GCTTACGATATGGTAATC---------GAA
481482483484485486487488489490491492493494495496497498499500501502503504
V G G G S I R I H D S Q L Q N K M F E L L G F T
V G G G S I R - - - - - - - - - - - - - - - - -
GTAGGAGGGGGATCAATCCGT---------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P E R A Q E Q F G F L M N A F K F G A P P H G G
- - - - - - - - - - - - - - - - - - - P P H G G
---------------------------------------------------------CCTCCTCATGGCGGA
529530531532533534535536537538539540541542543544545546547548549550551552
L A Y G L D R W V S L F A G L D S I R D C I A F
L A Y G L D R W V S L - - - - - - - - - - - - -
CTGGCTTACGGATTAGATCGTTGGGTATCTCTT---------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P K N N S G R D V M L D A P A A L D P S Q L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585
L N L I V D I K E
- - - - - - - - -
---------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_asp_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q R T Y Y C G E V P E T A V G E R V I L K G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V Q K R R D L G G L I F I D L R D R T G I V Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V A S P D V S A E A L A A A E R V R S E Y V V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E G T V V A R A P E T V N P N I A T G R I E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q A E R I D I I N E A K T P P F A I S D D T D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A E D V R L K Y R Y L D L R R P V M F Q T L A L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CTT
145146147148149150151152153154155156157158159160161162163164165166167168
R H K V T K A V R D F L D S E R F L E I E T P M
R H K V T K A V R D F L D S E R F L E I E T P M
CGCCATAAAGTGACGAAAGCGGTGCGCGACTTTTTGGATAGCGAACGCTTTTTGGAAATTGAAACGCCGATG
169170171172173174175176177178179180181182183184185186187188189190191192
L T K S T P E G A R D Y L V P S R V H P G E F Y
L T - - - - - - - - - - - - - - - - - - - - - -
TTGACG------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L P Q S P Q I F K Q L L M V G G V E R Y Y Q I
A L P Q S P Q I F K Q - - - - - - - E R Y Y Q I
GCCTTGCCGCAGTCGCCGCAAATTTTTAAGCAG---------------------GAACGGTACTACCAAATC
217218219220221222223224225226227228229230231232233234235236237238239240
A R C F R D E D L R A D R Q P E F T Q I D I E M
A R C F R D - - - - - - - - P E F T Q I D I E M
GCCCGTTGCTTCCGTGAC------------------------CCGGAATTTACGCAAATCGACATCGAAATG
241242243244245246247248249250251252253254255256257258259260261262263264
S F I E Q K D I M D L T E R M M A A V V K A A K
S - - - Q K D I M D L T E R M M A - - - - - - -
TCG---------CAAAAGGATATTATGGATTTAACCGAACGGATGATGGCT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I D I P R P F P R I T Y D E A M S R Y G S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P D I R F G L E L V D V S E I V R N S A F Q V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A R A V K E G G Q V K A I N A K G A A P R Y S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K D I D A L G E F A A R Y G A K G L A W L K A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G D E L K G P I A K F F T A D E Q T A L R Q L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A V D D G D L L L F V A D R P A V V A A A L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L R L K L G K E L G L I D E T R L A F L W V T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W P L L E Y D E E E G R Y Y A A H H P F T M P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R D D I P L L E T N P G A V R A Q A Y D L V L N
- - - - - - - - - - - - - - - - - A Y D L V L -
---------------------------------------------------GCGTACGATTTAGTGTTA---
481482483484485486487488489490491492493494495496497498499500501502503504
G Y E L G G G S L R I F E R D V Q E K M F Q A L
- - E L G G G S L R - - - - - - - - - - - - - -
------GAGCTCGGCGGCGGTTCGCTCCGC------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G F S K E E A R R Q F G F L L E A F E Y G T P P
- - - - - - - - - - - - - - - - - - - - - - P P
------------------------------------------------------------------CCGCCG
529530531532533534535536537538539540541542543544545546547548549550551552
H G G I A L G L D R L V M L L A G R T N L R D T
H G G I A L G L D R L V M L - - - - - - - - - -
CATGGCGGCATCGCCCTCGGCCTCGACCGGCTCGTCATGCTG------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I A F P K T A S A S C L L T E A P G P V S E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590
L E E L H L A V V L P R E E
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_asp_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R T H T C G E L R R D H I D Q T V T L A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V H R R R D H G T V L F L D L R D R Y G L T Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I V D P S S N P E A R A M L D S I K N E Y V I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V T G R V R S R L E G A E N A N L A T G A I E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E V Q S A K I L N T A K T P P I L V N R D G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D E A L R L K Y R Y I E L R R E R Q Q H I L G L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------TGG
145146147148149150151152153154155156157158159160161162163164165166167168
R H R T I K F M R D W M D R E G F W E I E T P I
R H R T I K F M R D W M D R E G F W E I E T P I
ATGGTGAGCGGCATCCCATTCGCCACTTTCGGCATTGTATTCAAACATTGGGAAGTCGATTACCCAGGCAAA
169170171172173174175176177178179180181182183184185186187188189190191192
L M K S T P E G A R D Y L V P S R L H P G E F Y
L M - - - - - - - - - - - - - - - - - - - - - -
ATGCAT------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L P Q S P Q Q L K Q L L M V S G I D K Y F Q I
A L P Q S P Q Q L K Q - - - - - - - D K Y F Q I
TACCACTGCTGGTTTGTCGGCAACATAGACAAT---------------------CGTTGCACTCTTTAATTG
217218219220221222223224225226227228229230231232233234235236237238239240
A R C M R D E D L R A D R Q P E F T Q L D I E M
A R C M R D - - - - - - - - P E F T Q L D I E M
ATCAAGTTGGGCTTGCTC------------------------CACGCTGCCATCAGCTTCGATCGCCATCCA
241242243244245246247248249250251252253254255256257258259260261262263264
S F V E Q D D V L D V V E R L M T E L V A N V T
S - - - Q D D V L D V V E R L M T - - - - - - -
AGC---------GGCTCCACCAATTTTGGCAACTTCTTGCAGATCGTCGAT---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P H K R L V S P F P R L T Y A D A I E Y Y G S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K P D L R Y D L K F V N V G E I V K D S Q F G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F T G A L S S G G K V Q A I R L P G C G S Y S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K Q I D D L Q E V A K I G G A K G M A W M A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A D G S V R S P I A K F F E Q A Q L D Q L K S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T A A E A G D L I V Y V A D K P A V V A A S L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K V R R E M A K R L D L A D K D L M H F A W V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D F P M F E Y N A E S G E W D A A H H P F C M V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N P A D V E K M Q R G E F E G V R A A S Y D L V
- - - - - - - - - - - - - - - - - - - S Y D L V
---------------------------------------------------------CTCGCCACCATCACG
481482483484485486487488489490491492493494495496497498499500501502503504
C N G Y E L A S G S I R I H D R S I Q Q Y I F D
C - - - E L A S G S I R - - - - - - - - - - - -
ATT---------TGGCGGAGTTTTGGCAGTGTTGAG------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
R L P Y S P E E I Q K R F G H M L E A F E Y G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P P H G G M A P G I D R L V M L L A D T D N I R
P P H G G M A P G I D R L V M L - - - - - - - -
ATTTTTGATGCTATCGAGCATAGCGCGAGCTTCGGGATTCGACGAAGG------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D V I A F P K T Q R A E D L M M N A P S S V D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594
K Q L R E L G L R L A D G V E P R G
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_asp_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T S P L K R T L T R E L P Q H E G Q T V K L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G F V H A R R D L G G V Q F L V L R D V T G V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q C V G S G L T L P L A E S S V E V V G K V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H P K A P G G F E V Q V E D F R V I S A A T E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T P V E I P K M E W N V N P E T M L D Y R V V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V R G L K E R A A L K V Q A E L V D A F R A H L
- - - - - - - - - - - V Q A E L V D A F R A H L
---------------------------------GAGCAGGCGCTCGGCTTCGGGGTCGAGGTCTTTGCCGCC
145146147148149150151152153154155156157158159160161162163164165166167168
R G E G F T E I S T P K I V S A G A E G G A N L
R G E G F T E I S T P K I V - - - - - - - - - -
GACCGGGTGGCCGTATTTTTCCGTCACCAGTTGCCGGGCGTC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F P I D Y F G H P A Y L A Q S P Q L Y K Q I M V
- - - - - - - - - - Y L A Q S P Q L Y K Q - - -
------------------------------AAACTCGGCCTGCGAGGTGGCCCGCAGCCGCTC---------
193194195196197198199200201202203204205206207208209210211212213214215216
G V F E R V F E V A A V Y R A E E H A T S R H L
- - - E R V F E V A A V Y R A - - - - - - - - -
---------GCGGTTCTCGAGGCCCATCACGTCTTCCTCGTCCTC---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N E Y L S L D V E M G F I E D E E D V M G L E N
N E Y L S L D V E M G - - - - E E D V M G L E N
CAGGTATTCGTTGAGGTGACGGCTGGTGGCGTG------------GTAGACGGCGGCGACTTCGAAGACGCG
241242243244245246247248249250251252253254255256257258259260261262263264
R L L A S I M E R L R A T S Q A E F E L L G A T
R L L A - - - - - - - - - - - - - - - - - - - -
CTCGAACACGCC------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I P D V P A H I P R I T L M D A R Q L V T E K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G H P V G G K D L D P E A E R L L S Q H F A E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E G S D F V F V T K Y P R A A R P F Y A H P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N E D G S V N G E V T R G F D L L F R G I E I T
- - - - - - - - - - - - G F D L L F - - - E I T
------------------------------------GCGGAAGTCTTCCACCTG---------GCCGCCGGG
361362363364365366367368369370371372373374375376377378379380381382383384
S G G Q R I H D Y G M L M D S I A A Y K L K P E
S G G Q R - - - - - - - - - - - - - - - - - - -
CGCTTTGGGGTGGGC---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S L E G Y T E V F K Y G M P P H G G F A I G A E
- - - - - - - - - - - - - P P H G G F A I G A E
---------------------------------------CAAAAATTGCACGCCCCCCAGGTCGCGGCGGGC
409410411412413414415416417418419420421422423424425426427428429430431432
R L T A K L L G I A N V R Y A R A F P R D R H R
R L T A K - - - - - - - - - - - - - - - - - - -
GTGGACGAAGCCTTG---------------------------------------------------------
433434435
L T P
- - -
---------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_asp_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R T H T C G E L R A T D E G K K V K L C G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V D R I R D L G G V R F I D L R D R Y G E T Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V C D V N S E A Y S V V D E L T R E S V V L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G T V R K R P E G T E N P N I E T G E I E V V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E R I E I L S L A D P L P F Y P G E T P K E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R L K Y R Y I D L R S E R M K R N I I L R Y R I
- - - - - - - - - - - - - - - - - - - L R Y R I
---------------------------------------------------------TTGAGATACAGAATA
145146147148149150151152153154155156157158159160161162163164165166167168
S K I I R D Y F D E L G F L E I E T P F L T R S
S K I I R D Y F D E L G F L E I E T P F L T - -
TCGAAAATCATCAGAGATTACTTTGATGAACTCGGTTTCCTTGAAATAGAAACTCCCTTTCTCACA------
169170171172173174175176177178179180181182183184185186187188189190191192
T P E G A R D F L V P S R L R P G K F Y A L P Q
- - - - - - - - - - - - - - - - - - - - A L P Q
------------------------------------------------------------GCGCTGCCTCAA
193194195196197198199200201202203204205206207208209210211212213214215216
S P Q L F K Q I L M I S G F D R Y F Q I V R C F
S P Q L F K Q - - - - - - - D R Y F Q I V R C F
TCTCCTCAGCTCTTCAAGCAG---------------------GACAGATACTTCCAGATAGTCAGATGCTTC
217218219220221222223224225226227228229230231232233234235236237238239240
R D E D L R A D R Q P E F T Q V D V E M S F V D
R D - - - - - - - - P E F T Q V D V E M S - - -
AGGGAC------------------------CCGGAGTTCACCCAGGTTGACGTGGAGATGTCC---------
241242243244245246247248249250251252253254255256257258259260261262263264
V E D V L N V S E G M V S R V F K E S S G I D L
V E D V L N V S E G M V S - - - - - - - - - - -
GTGGAAGATGTACTGAATGTGAGCGAAGGAATGGTTTCA---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K V P F D R I P Y D D A M E K Y G T D K P D R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y G M E L R D F G Y A F E T T E F K V I R N V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N E G G S V K G F I V P G F A S E M S R K K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E L M A R M K E L G L G G L I W F K L D G G I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S P H L K H L E K E F R K I A E T E N M N E G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V C L I A A H T D R N L L N E A L G T L R L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G K E H F S H L A K G F D V L W V V D F P Y F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W S E E E E R F V A R H H P F T M P V L E T L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D D Y T K V R A K A Y D L V I N G Y E V G G G S
- - - - - - - - - A Y D L V I - - - E V G G G S
---------------------------GCCTACGATCTCGTCATC---------GAAGTCGGTGGAGGAAGC
481482483484485486487488489490491492493494495496497498499500501502503504
I R I H R R D I Q E K I F E L L G L S E E E A Q
I R - - - - - - - - - - - - - - - - - - - - - -
ATCAGG------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K K F G F F L E A F R Y G V P P H G G I A F G L
- - - - - - - - - - - - - - P P H G G I A F G L
------------------------------------------CCGCCGCACGGCGGGATAGCTTTCGGACTG
529530531532533534535536537538539540541542543544545546547548549550551552
D R L V S I I A G E S S I R E V I A F P K T G N
D R L V S I - - - - - - - - - - - - - - - - - -
GATCGATTGGTGAGCATC------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G V C L L T G A P A E V D E R Q L R E L R I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579
E E G
- - -
---------
Class II
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_asp_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L T E Y G D F K R T K Y C G E V S E E D I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V K L A G W V H R K R H H G G V I F I D L R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R E G I V Q V V V E E K T N P E A Y E V A D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K S E Y V I G V V G K V R K R P E G T E N P K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K T G Y V E V V A D R I L V F N T S E A L P F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E E E T H V S E E T K L K Y R Y I D L R R E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M K N N L I F R H R V Y Q I T R N F F T K E G F
- - - - - - F R H R V Y Q I T R N F F T K E G F
------------------TTCAGACACAGGGTTTACCAGATAACTAGAAACTTCTTCACAAAAGAGGGTTTT
169170171172173174175176177178179180181182183184185186187188189190191192
I E I E T P F L T K S T P E G A R D F L V P S R
I E I E T P F L T - - - - - - - - - - - - - - -
ATAGAAATAGAAACTCCCTTCCTTACA---------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L H P G K F Y A L P Q S P Q L F K Q I L M I A G
- - - - - - - A L P Q S P Q L F K Q - - - - - -
---------------------GCCCTTCCTCAATCTCCTCAGCTATTTAAACAA------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F D R Y F Q I V K C F R D E D L R A D R Q P E F
- D R Y F Q I V K C F R D - - - - - - - - P E F
---GACAGGTACTTCCAGATAGTAAAGTGTTTCAGGGAC------------------------CCCGAATTT
241242243244245246247248249250251252253254255256257258259260261262263264
T Q I D Y E M S F V S E E E V M D V A E R L I A
T Q I D Y E M S - - - E E E V M D V A E R L I A
ACCCAGATAGATTACGAGATGTCC---------GAAGAAGAGGTAATGGATGTTGCGGAAAGACTTATCGCC
265266267268269270271272273274275276277278279280281282283284285286287288
T L F K E L L G V E L K T P F E R I S Y R E A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E K Y G T D K P D R R F G L E L I E L T D I F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N T A F K V F K S V V E A G G I I K A I N F K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S N L S R K E I D E L T K F V Q S L G A K G L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
W I K V E K D K L T S P I V K F F T E E E T Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L E R T K A E P G D V I L F S A D K K E M V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I L G N L R L H L G K K Y K L I D E S K W D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F W I V D F P L M E W D E E E E R F V S L H H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F T M P R E E N I P K L K E A L E E E D L E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K E I V H S V R A R A Y D M V L N G E E I G G G
- - - - - - - - - - A Y D M V L - - - E I G G G
------------------------------GCTTACGACATGGTCCTG---------GAAATAGGCGGAGGT
505506507508509510511512513514515516517518519520521522523524525526527528
S I R I H R R D I Q E V V F K L L G I G E V E A
S I R - - - - - - - - - - - - - - - - - - - - -
TCTATACGT---------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Q E K F G F L L E A L K Y G A P P H G G L A F G
- - - - - - - - - - - - - - - P P H G G L A F G
---------------------------------------------CCTCCCCACGGTGGACTTGCCTTCGGG
553554555556557558559560561562563564565566567568569570571572573574575576
L D R V V A L M L G L D S I R D T I A F P K T Q
L D R V V A L - - - - - - - - - - - - - - - - -
CTTGATAGGGTAGTGGCTTTG---------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R G I C P L T G A P D Y V D P K Q L K E L H I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603
V L E
- - -
---------
Class II
Bacteria/Mycobacterium smegmatis/amino acid sequences/Msmegmatis_asp_aa
Bacteria/Mycobacterium smegmatis/nucleotide sequences/Msmegmatis_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R T H A A G S L R P A D A G Q T V T L A G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V A R R R D H G G V I F I D L R D A S G V S Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V F R E G D V L A A A H R L R A E F C V A V T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V E V R P E G N E N P E I P T G Q I E V N A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L T V L G E S A P L P F Q L D E Q A G E E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L K Y R Y L D L R R E G P G N A L R L R S K V N
- - - - - - - - - - - - - - - - - - L R S K V N
------------------------------------------------------CTGCGGTCGAAGGTCAAC
145146147148149150151152153154155156157158159160161162163164165166167168
A A A R S V L A E H D F V E I E T P T L T R S T
A A A R S V L A E H D F V E I E T P T L T - - -
GCCGCCGCACGGTCCGTGCTCGCCGAACACGACTTCGTCGAGATCGAGACCCCGACGCTGACG---------
169170171172173174175176177178179180181182183184185186187188189190191192
P E G A R D F L V P A R L Q P G S F Y A L P Q S
- - - - - - - - - - - - - - - - - - - A L P Q S
---------------------------------------------------------GCGCTGCCGCAGAGC
193194195196197198199200201202203204205206207208209210211212213214215216
P Q L F K Q L L M V A G M E R Y Y Q I A R C Y R
P Q L F K Q - - - - - - - E R Y Y Q I A R C Y R
CCGCAGCTGTTCAAGCAG---------------------GAGCGCTACTACCAGATCGCACGCTGCTACCGC
217218219220221222223224225226227228229230231232233234235236237238239240
D E D F R A D R Q P E F T Q L D M E M S F V E A
D - - - - - - - - P E F T Q L D M E M S - - - A
GAC------------------------CCCGAGTTCACCCAGCTCGACATGGAGATGAGC---------GCC
241242243244245246247248249250251252253254255256257258259260261262263264
D D V I A I S E Q V L K A V W A T I G Y D L P L
D D V I A I S E Q V L K - - - - - - - - - - - -
GACGACGTCATCGCGATCTCCGAGCAGGTCCTCAAG------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P L P R I S Y E E A M R R F G S D K P D L R F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I E L V E C T E Y F K D T T F R V F Q A P Y V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A V V M P G G A S Q P R R T L D G W Q E F A K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R G H K G L A Y V L V G E D G T L G G P V A K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L S D A E R D G L V A H V G A N P G D C I F F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A G P A K G A R A L L G A T R I E I A K R L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I D P N A W A F T W V V D F P M F E A A D E A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A A G D V A V G S G A W T A M H H A F T A P K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D S V D T F D S D P G N A L S D A Y D I V C N G
- - - - - - - - - - - - - - - - A Y D I V C - -
------------------------------------------------GCCTACGACATCGTGTGC------
481482483484485486487488489490491492493494495496497498499500501502503504
N E I G G G S I R I H R R D I Q E R V F A M M G
- E I G G G S I R - - - - - - - - - - - - - - -
---GAGATCGGTGGCGGCTCGATCCGT---------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I D H D E A Q E K F G F L L D A F S Y G A P P H
- - - - - - - - - - - - - - - - - - - - - P P H
---------------------------------------------------------------CCGCCGCAC
529530531532533534535536537538539540541542543544545546547548549550551552
G G I A F G W D R I T A L L A G V D S I R E V I
G G I A F G W D R I T A L - - - - - - - - - - -
GGCGGCATCGCGTTCGGCTGGGATCGCATCACCGCACTG---------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A F P K S G G G V D P L T D A P A P I T P Q Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598
K E S G I D A K P R E D K P K E D A K S K A
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_asp_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K T I L N N T I T I K H V D E K V T V Y G F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K I R K L G E I I F V D L R D E S G I L Q I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F E S S N I D F T K E S I L E I I G I V S K R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S I N T N L Q T G E I E I K V N S Y K V L S L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E L P F E I N S S N E T N E E L R L K Y R F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D L R S K K L Q E N I R L R H K V T R S M R N F
- - - - - - - - - - - - L R H K V T R S M R N F
------------------------------------CTAAGACACAAAGTCACTAGATCAATGCGTAATTTT
145146147148149150151152153154155156157158159160161162163164165166167168
L D R N N Y I N I E T P N L G R I T P E G A K D
L D R N N Y I N I E T P N L G - - - - - - - - -
TTAGATAGAAATAATTATATTAATATAGAAACACCAAATTTAGGA---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F I V P S R K K G F F F S L P Q S P Q L Y K Q L
- - - - - - - - - - - - S L P Q S P Q L Y K Q -
------------------------------------TCTTTACCTCAATCACCACAATTGTATAAACAA---
193194195196197198199200201202203204205206207208209210211212213214215216
L M A S G F E K Y Y Q I A R A F R D E K S R K D
- - - - - - E K Y Y Q I A R A F R D - - - - - -
------------------GAAAAATATTATCAAATAGCAAGAGCTTTTAGGGAT------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R Q L E F T Q L D I E M A Y A K E E I V I H L I
- - L E F T Q L D I E M A - - - E E I V I H L I
------CTTGAATTCACACAATTAGATATTGAAATGGCT---------GAAGAAATTGTAATTCATTTAATT
241242243244245246247248249250251252253254255256257258259260261262263264
E N L F K E I F T D L N I D I K I P F P K M N Y
E N L F K - - - - - - - - - - - - - - - - - - -
GAAAATCTTTTTAAA---------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D D A L N Q Y G S D K P D L R Y E Y K L Q D F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H L I P K F N S K V F K N V K S L K I I I I P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N I T K K Q F E F L E E E A K Q N H S K G L L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A N F E K N K A I S G N F F Q F F K S E L E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q G E L K H N F K E K F A I L A I A D D L E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N Q A L G S V R V K L D E F F D F E K K D F A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T W V I N W P L Y E F D K E V N K F Q A A H H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F T M P Q L E Y L D N F D K K P M E A K S R A Y
- - - - - - - - - - - - - - - - - - - - - - A Y
------------------------------------------------------------------GCTTAT
457458459460461462463464465466467468469470471472473474475476477478479480
D I V L N G Y E V G G G S I R I N D L E I Q K R
D I V L - - - E V G G G S I R - - - - - - - - -
GATATTGTTTTA---------GAAGTTGGCGGAGGTTCAATTAGA---------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M F R T L G L S E K Q I E E Q F D F F L T A F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Y G F P P H G G I A L G I D R L L S I L T N S T
- - - P P H G G I A L G I D R L L S I - - - - -
---------CCGCCTCATGGAGGAATTGCTTTAGGAATCGATAGATTACTTTCAATT---------------
529530531532533534535536537538539540541542543544545546547548549550551552
S I R D V I A F P K N S K G I D P F T K A P S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567
L E N E L L K E Y G I I I K E
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_asp_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F K V I K C N E L N E K L I D K K V E I N A W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V K K I R H H G K F I F L N I R D R Y E K A Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L V N E E K L L K I A E K I K L E Y C I K I Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L L I K R P P N M I N A N M K T G H F E I L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N I E I I S K C N E L P F M I E D D N N A S E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S K L E Y R Y L D L R R D S L K N K I I L R C Q
- - - - - - - - - - - - - - - - - - - - L R C Q
------------------------------------------------------------GTGGTGAGCTGG
145146147148149150151152153154155156157158159160161162163164165166167168
A T H L I R N F L I K R K F L E L E T P T F V K
A T H L I R N F L I K R K F L E L E T P T F V -
TGAATAGGTTTTTGTATTTTCGTCATATTCAAATAGTGGAAAATCATAGACCCATAGAAATTCAAATTT---
169170171172173174175176177178179180181182183184185186187188189190191192
S T P E G A R D F V I P S R I H K G S F Y A L P
- - - - - - - - - - - - - - - - - - - - - A L P
---------------------------------------------------------------AGTTTCCCA
193194195196197198199200201202203204205206207208209210211212213214215216
Q S P Q L Y K Q L I M I A G F D K Y F Q I A R C
Q S P Q L Y K Q - - - - - - - D K Y F Q I A R C
GTTATTATTAGCTGTAAAGAAAAT---------------------ATAGGTTTTTATTAATTCCTGTTCTTC
217218219220221222223224225226227228229230231232233234235236237238239240
Y R D E D S R G D R Q P E F T Q L D L E M S F V
Y R D - - - - - - - - P E F T Q L D L E M S - -
TGTTTTTAA------------------------TTTATTGTTTTCAATTTTTGTAAAATAAAGCCC------
241242243244245246247248249250251252253254255256257258259260261262263264
K K E N I F K L I E N M L F L I F K N C I N I N
- K E N I F K L I E N M L F - - - - - - - - - -
---GTAAAGCTTTGCAATTTCTTCTAAATTGTTTATTTTTGC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L P K K F K K I T Y K K A M N K Y G S D K P D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F E L E L Q D I S R N L K N S E F N I F K D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L K N K G S I K I L I V K D K A D K F S R A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N N L E E I A K L Y K T Q G L Y F T K I E N N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F S G G I A K F L K T E E Q E L I K T Y S L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N D I I F F T A N N N W E T A C K A M G Q I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I A N D L G L I D E N K F E F L W V Y D F P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F E Y D E N T K T Y S P A H H M F S L P K K Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I A N L E K N P K K T I G E I Y D L V L N G V E
- - - - - - - - - - - - - - I Y D L V L - - - E
------------------------------------------TGCATTATTGTCATCTTC---------TGG
481482483484485486487488489490491492493494495496497498499500501502503504
L G S G S I R I H N K E L Q Q R I F K I I G F Q
L G S G S I R - - - - - - - - - - - - - - - - -
CAATTCATTGCACTTTGAGAT---------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K E K S E D R F G F F L K A L E Y G A P N H G G
- - - - - - - - - - - - - - - - - - - P N H G G
---------------------------------------------------------AAGTTTTATTTTTTC
529530531532533534535536537538539540541542543544545546547548549550551552
I A I G I D R L I M L M T K S T S I K D V I L F
I A I G I D R L I M L - - - - - - - - - - - - -
TGCGATCTTTAGAAGCTTTTCTTCATTTACCAG---------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P K N S F A A S P L D N S P S K I S N E Q L K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586
L G I N I V D G D N
- - - - - - - - - -
------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_asp_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R T H T C G E L R L Q H I G I S V T L C G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V Q K I R N K G S L V W I D L R D R Y G I T Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I L E E H I T A P E I L S Q V Q H I G R E Y V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A T G S V I E R S A K N P S M P T G D I E I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V K S L T I L N T A K T P P F L I E E Q T D G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E L R M Q Y R Y L D L R R P P L Q K N L L L R
- - - - - - - - - - - - - - - - - - - - - - L R
------------------------------------------------------------------ATAACG
145146147148149150151152153154155156157158159160161162163164165166167168
Q L V A Q H A R A Y L E Q H H F V D V E T P L L
Q L V A Q H A R A Y L E Q H H F V D V E T P L L
CTGAGACTCTTCATTCCATTCTAAAAGTGGGAAGTCTACCACCCACAAAGGAGCAAATTTATCTTTAGAAAC
169170171172173174175176177178179180181182183184185186187188189190191192
I K S T P G G A R D F V V P S R I H P Q Q F Y A
I - - - - - - - - - - - - - - - - - - - - - - A
TAA------------------------------------------------------------------AGC
193194195196197198199200201202203204205206207208209210211212213214215216
L P Q S P Q I F K Q L L M V A G L D R Y Y Q I A
L P Q S P Q I F K Q - - - - - - - D R Y Y Q I A
CAAAATAAGTAATAAGTCGCCTGGAACTGC---------------------TGTTAGTTGTTCAACATCATA
217218219220221222223224225226227228229230231232233234235236237238239240
K C F R D E D F R A D R Q P E F T Q I D C E L S
K C F R D - - - - - - - - P E F T Q I D C E L S
GAATTTACTTACTGG------------------------ATATTTTACATACACCAACCCACTTGTAACAAG
241242243244245246247248249250251252253254255256257258259260261262263264
F V T Q A D I L H I F E N F T K Y I F E A T I Q
- - - Q A D I L H I F E N F T K - - - - - - - -
---------CTTTATATATTCTGTAAGATCATCTAGCTGCTTCCTAGT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V R L D K F P C I T Y A E A M Q K Y G T D K P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I R F G M R L I E L T E L V K N S E F P L F K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A K L I A G I C V K G C A D Y T R K Q L D D L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E Y I K K L N L V T S G L V Y V K Y L A D G S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N S P V S K F Y D V E Q L T L W A K Q M H A V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G D L L L I L A G E I E A T Q I A L G S L R L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L R D E L H L V S K D K F A P L W V V D F P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E W N E E S Q R Y V S R H H P F T S P K Q E D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E L L S T K P E T V R A N A Y D L V I N G M E I
- - - - - - - - - - - - - A Y D L V I - - - E I
---------------------------------------TTCAATTAAAAAAGGAGG---------TGTATT
481482483484485486487488489490491492493494495496497498499500501502503504
G G G S I R I H D R A L Q E Q I F N V L G F S E
G G G S I R - - - - - - - - - - - - - - - - - -
AAGAATAGTAAGCGACTT------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E E A R Q Q F G F L T D A F E Y G A P P H G G I
- - - - - - - - - - - - - - - - - - P P H G G I
------------------------------------------------------GCTTAAGATTTCTGGTGC
529530531532533534535536537538539540541542543544545546547548549550551552
A F G F D R L C A I I G R E D S I R P F I A F P
A F G F D R L C A I - - - - - - - - - - - - - -
TGTTATATGCTCTTCTAAAATAAGTTGTGT------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K N N A G R D V M M K A P S T I T E Q Q I S E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582
G I I L S K
- - - - - -
------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_asp_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K R T T Y C G L V T E A F L G Q E I T L K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W V N N R R D L G G L I F V D L R D R E G I V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V F N P A F S E E A L K I A E T V R S E Y V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V Q G T V T K R D P E T V N P K I K T G Q V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Q V T N I K V I N K S E T P P F S I N E E N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V D E N I R L K Y R Y L D L R R Q E L A Q T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K M R H Q I T R S I R Q Y L D D E G F F D I E T
- M R H Q I T R S I R Q Y L D D E G F F D I E T
---CGCATCTTCATCATATTCTAATAATGGCCAATCTGTCACCCATAAGAAGTTTAATTTTGTTTCATCGAT
169170171172173174175176177178179180181182183184185186187188189190191192
P V L T K S T P E G A R D Y L V P S R V H D G E
P V L T - - - - - - - - - - - - - - - - - - - -
TAAACCTAATTC------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F Y A L P Q S P Q L F K Q L L M I S G F D K Y Y
- - A L P Q S P Q L F K Q - - - - - - - D K Y Y
------CATTACTAAGTCACCAGCTTCAGCACCAGTTAA---------------------TTCTGCCTCAAA
217218219220221222223224225226227228229230231232233234235236237238239240
Q I V K C F R D E D L R A D R Q P E F T Q V D I
Q I V K C F R D - - - - - - - - P E F T Q V D I
GAAACGTCCAATTGGACCTGTCAA------------------------TGCTAATCCTTTAGCACCATAGAT
241242243244245246247248249250251252253254255256257258259260261262263264
E M S F V D Q E D V M Q M G E E M L K K V V K E
E M S - - - Q E D V M Q M G E E M L K - - - - -
GTTTACAAA---------AGCATCCATATCTTTACGTGTATATTGTTCAGCTGCACC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
V K G V E I N G A F P R M T Y K E A M R R Y G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D K P D T R F E M E L I D V S Q L G R D M D F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V F K D T V E N D G E I K A I V A K G A A E Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T R K D M D A L T E F V N I Y G A K G L A W V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V E D G L T G P I G R F F E A E N V E T L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L T G A E A G D L V M F V A D K P N V V A Q S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G A L R V K L A K E L G L I D E T K L N F L W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T D W P L L E Y D E D A K R Y V A A H H P F T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P K E A D I A K L G T A P E E A E A N A Y D I V
- - - - - - - - - - - - - - - - - - - A Y D I V
---------------------------------------------------------AGAAAATGGTGGTGT
481482483484485486487488489490491492493494495496497498499500501502503504
L N G Y E L G G G S I R I H D G E L Q E K M F E
L - - - E L G G G S I R - - - - - - - - - - - -
CTC---------AATCACTTTAATATTTGTAACTTG------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V L G F T K E Q A Q E Q F G F L L D A F K Y G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
P P H G G I A L G L D R L V M L L T N R T N L R
P P H G G I A L G L D R L V M L - - - - - - - -
TTTCAATGCCTCTTCTGAAAATGCAGGATTAAACACAACTTGTACAAT------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D T I A F P K T A S A T C L L T N A P G E V S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588
K Q L E E L S L R I R H
- - - - - - - - - - - -
------------------------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_asp_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I K M A D P A P Q Q P A E L S K K A L K K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K E A E K Q A K R A E N K S K Q A G V D F A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A Y I P P V L T T A Q F R R L R F G D A P L H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S Q P E L S S F R K L T D I D R P L T H L V G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K V W V R A R I H T V R A T G K S A F L M L R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K M A I L Q A C C F V P G K S E G S A E K V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y R A M I K Y I N S L P P E S V V E V C G A L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S V D A P I K T A S A E H R D Y E L Q L E K I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A I S R A A S Q M P L Q V D D A M R P D S V Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A P D S Q Y V R P G K D T K Q D Y R V I D L R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P T N Q A I M R V R S A I A H E F R S F L D K A
- - - - - - - - V R S A I A H E F R S F L D K A
------------------------GTGAGGAGCGCAATTGCGCACGAATTCCGATCCTTCCTGGATAAGGCT
265266267268269270271272273274275276277278279280281282283284285286287288
G F I E I N T P K I V A G T S E G G A A V F N V
G F I E I N T P K I V - - - - - - - - - - - - -
GGCTTCATTGAAATCAATACCCCCAAGATAGTT---------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N Y F N T K A C L A Q S P Q L Y K Q M C I S S G
- - - - - - - C L A Q S P Q L Y K Q - - - - - -
---------------------TGCTTGGCCCAGTCGCCGCAGCTCTACAAGCAG------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F G R V Y E V G P V F R A E H S H T H R H L C E
- G R V Y E V G P V F R A - - - - - - - - - C E
---GGTCGTGTGTATGAAGTTGGGCCTGTCTTTAGAGCT---------------------------TGTGAG
337338339340341342343344345346347348349350351352353354355356357358359360
F I G L D L E M E I Y E S Y T E I L V L L G D L
F I G L D L E M E - - - - Y T E I L V L L G D L
TTCATCGGTCTTGATTTAGAAATGGAG------------TACACGGAGATCCTTGTCCTGTTAGGGGATCTT
361362363364365366367368369370371372373374375376377378379380381382383384
M K H I F K A V E A R C S K E M S I V R T Q Y D
M K - - - - - - - - - - - - - - - - - - - - - -
ATGAAG------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L T A P E P L V W A D E T V I V T F C D G I K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L Q E A G Y E A S P L D D L S T E N E R A L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L I K E K Y N T D F Y I L D K F P L N A R P F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T M P D P H D G R Y S N S Y D M F I R G E E I C
- - - - - - - - - - - - S Y D M F I - - - E I C
------------------------------------AGTTATGACATGTTCATT---------GAGATATGC
481482483484485486487488489490491492493494495496497498499500501502503504
S G A Q R V H D P E L L E K Q C R E R N V D P E
S G A Q R - - - - - - - - - - - - - - - - - - -
TCAGGGGCCCAGCGT---------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S L R S Y I D A F R Y G C A P H G G A G L G L E
- - - - - - - - - - - - - A P H G G A G L G L E
---------------------------------------GCACCACATGGCGGGGCAGGACTTGGTCTGGAA
529530531532533534535536537538539540541542543544545546547548549550551552
R I V M L M L G I E N C R Q T C L F P R T Q E R
R I V M L - - - - - - - - - - - - - - - - - - -
AGGATCGTTATGCTG---------------------------------------------------------
553554555
L T P
- - -
---------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_asp_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N S N H A D A G A P A M E K K M S D K E A R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A R L A E E K A R A E E K A A L V E K Y K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F G A A P M V Q S T T Y K S R T H I P V A K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q P E L V S K T V L I R A R V S T T R K K G K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A F M V L R D G S D S V Q A M A A V E G N V P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E M I D F M G Q I A T E S I V D V E A T V C K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E Q P I T S T S H S D I E L K V K K I H T V T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L R T L P F T L E D A S R K E S D E G A K V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L D T R L N S R W M D L R T P A S G A I F R L Q
- - - - - - - - - - - - - - - - - - - - - - L Q
------------------------------------------------------------------GTGAGT
217218219220221222223224225226227228229230231232233234235236237238239240
S R V C Q Y F R Q F L I D N D F C E I H S P K I
S R V C Q Y F R Q F L I D N D F C E I H S P K I
GGCAAGGTGCTCGAAAATGTAGTTGAATAGGCTCTCCGCCACATCCAGCACCTCGTAGTAGTGCTCATCGAT
241242243244245246247248249250251252253254255256257258259260261262263264
I N A P S E G G A N V F K L E Y F N R F A Y L A
I - - - - - - - - - - - - - - - - - - - - Y L A
GCG------------------------------------------------------------GCGGAACAC
265266267268269270271272273274275276277278279280281282283284285286287288
Q S P Q L Y K Q M V L Q G D V P R V F E V G P V
Q S P Q L Y K Q - - - - - - - P R V F E V G P V
CGGTCCCACCTCGAACACGCGCGG---------------------CTGCTTGTACAGTTGTGGCGACTGGGC
289290291292293294295296297298299300301302303304305306307308309310311312
F R S E N S N T H R H L T E F V G L D V E M R I
F R S - - - - - - - - - T E F V G L D V E M R -
AAGGTACGC---------------------------CACGTTGGCGCCGCCCTCGCTTGGCGCGTTGAT---
313314315316317318319320321322323324325326327328329330331332333334335336
D E H Y Y E V L D V A E S L F N Y I F E H L A T
- - - Y Y E V L D V A E S L F N - - - - - - - -
---------GTGGATCTCACAGAAGTCGTTGTCGATAAGAAACTGGCG------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H T K E L K N V C Q Q Y P F E P L V W K L T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K M K E L G V G V I S E N V V P T D K F Q A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
H N M D S R M L R I N Y M H C I E L L N T V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E K M A P T D D I N T T N E K L L G K L V K E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y G T D F F I S D R F P S S V R P F Y T M E C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D D V R F T N S Y D M F I R G E E I S S G A Q R
- - - - - - - S Y D M F I - - - E I S S G A Q R
---------------------CGACACGCGGGCACGGAT---------CTTGCTCACCAACTCCGGCTGCGA
481482483484485486487488489490491492493494495496497498499500501502503504
I H D P D L L L A R A K M L N V D L T P I K E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V D S F R L G A W P H G G F G V G L E R V V M L
- - - - - - - - W P H G G F G V G L E R V V M L
------------------------CGCCTTTTCCTCCGCGCGGGCCTTCTCCTCCGCCAGGCGCGCCGCCTT
529530531532533534535536537538539540541542543544545546547548549550
Y L G L S N V R L A S L F P R D P Q R T T P
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_asp_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S W E G R D R G C G T L R E D D V G Y S L T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
C G W V H R Q R N M G G V C F T D I R D S S G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V Q V V S Q D D S V G L D Q L R A E Y V V R I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G Q L R M R K D P N E R L P T G K V E L V A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V T I L N T V N V K L P F L P S D E E L D V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E V R L R T R V L D L R R P R M T K N L K L R H
- - - - - - - - - - - - - - - - - - - - - L R H
---------------------------------------------------------------CTGAGGCAC
145146147148149150151152153154155156157158159160161162163164165166167168
R M L R A I R N F L D D R E F L E V E T P L L C
R M L R A I R N F L D D R E F L E V E T P L L C
CGCATGCTGCGCGCGATCCGAAACTTTCTGGACGATCGGGAGTTTCTGGAGGTGGAAACGCCGCTGCTGTGC
169170171172173174175176177178179180181182183184185186187188189190191192
R S T P E G A R D F L V P S R M Q P G S F Y A L
- - - - - - - - - - - - - - - - - - - - - - A L
------------------------------------------------------------------GCACTC
193194195196197198199200201202203204205206207208209210211212213214215216
P Q S P Q L F K Q M L C C A G V E R Y Y Q I A R
P Q S P Q L F K Q - - - - - - - E R Y Y Q I A R
CCACAAAGCCCGCAGCTGTTCAAGCAG---------------------GAGAGATACTACCAGATTGCTCGG
217218219220221222223224225226227228229230231232233234235236237238239240
C F R D E D L R S D R Q P E F S Q L D M E M T F
C F R D - - - - - - - - P E F S Q L D M E M T -
TGCTTTCGGGAC------------------------CCAGAGTTCTCTCAGCTGGATATGGAGATGACA---
241242243244245246247248249250251252253254255256257258259260261262263264
M D Q N A I M S L V E E M V L A V F N E V L G M
- - Q N A I M S L V E E M V L - - - - - - - - -
------CAGAATGCCATCATGTCTCTAGTGGAGGAGATGGTCCTT---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P V Q R P F R R M T Y A E A M T S Y G C D K P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R Y G L E H Y D V S S A V Q G C T F R V F S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A L E G E G I V K A M R V P D G K R I S N S R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K P K G D I S G E A V A A G A G G L V Y I R V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G A E I D A A K P V K E G L S E E Q C H A L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S S T G A Q P G D L L L L A A G E P A V V H K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L D R V R Q Y V A A D L G E I D E S K H A L L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V T D F P M F E W N E E E D R L E A V H H P F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A P N P D D L E G N G A G L R G A R A L A Y D L
- - - - - - - - - - - - - - - - - - - - A Y D L
------------------------------------------------------------GCCTATGACCTT
481482483484485486487488489490491492493494495496497498499500501502503504
V Y N G V E V A G G S L R T Y R R D V L E R V F
V Y - - - E V A G G S L R - - - - - - - - - - -
GTCTAC---------GAGGTGGCAGGCGGGAGCCTGCGC---------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D A I G L S R E E A K A Q F G Y L L N A F D V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A P P H G G I A F G L D R L C M L L A R E S S I
- P P H G G I A F G L D R L C M L - - - - - - -
---CCTCCCCATGGCGGCATCGCGTTCGGCCTGGACCGGCTCTGCATGCTG---------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R D V I A F P K T A Q A S A S T K L R S T L H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584
S P F A G W N A
- - - - - - - -
------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_asp_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R S H G C G D L R I T N V A N S V Q L S G W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D R F R D H G G V I F I D L R D Q S G T I Q I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V D P E Q G P E L F T Q A E H L R N E T V L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E G M V A A R P T L S I N E R L S T G E I E V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A K S L T V L N S V N G T F P F S V S I H D D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V R E E L R L R Y R Y L D L R R E R M N N N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R L R H N T V K A A R R F L E N E G F I E I E T
- L R H N T V K A A R R F L E N E G F I E I E T
---TTGCGTCACAATACTGTAAAAGCAGCACGCCGGTTTCTAGAAAATGAAGGTTTTATTGAAATAGAAACG
169170171172173174175176177178179180181182183184185186187188189190191192
P L L T R S T P E G A R D Y L V P S R V C G G E
P L L T - - - - - - - - - - - - - - - - - - - -
CCCCTTCTTACT------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W F A L P Q S P Q I F K Q L L M V G G I E R Y Y
- - A L P Q S P Q I F K Q - - - - - - - E R Y Y
------GCATTGCCTCAATCACCTCAAATCTTTAAACAA---------------------GAACGCTACTAC
217218219220221222223224225226227228229230231232233234235236237238239240
Q I A R C F R D E D L R A D R Q P E F T Q I D M
Q I A R C F R D - - - - - - - - P E F T Q I D M
CAGATAGCTAGATGTTTTCGTGAT------------------------CCAGAATTCACACAGATAGATATG
241242243244245246247248249250251252253254255256257258259260261262263264
E M S F M N Q K E I L R L N E S L I A S I W K E
E M S - - - Q K E I L R L N E S L I A - - - - -
GAAATGAGT---------CAGAAGGAAATACTAAGACTAAATGAATCCTTAATTGCA---------------
265266267268269270271272273274275276277278279280281282283284285286287288
V K D I E L Q L P F T R M T W H E A T E R Y G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D R P D A R Y G M E L V N I S D I V K N I E F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V F S S A I A N G G S V K C I A I P E G N D A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S N T R I K P G G D I L R E A E A S G A G G L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F I R V R E N G E I D S I G A I K N N L S E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K L E L L I R T G A E P G T L L L F G A G D T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T V N R V L N R V R Q Y I A R D L V L I A S A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D N K I W N F L W V T D F P M F E F N K E E N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L E A L H H P F C S P N L K D L G D D T A N Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K R L P N A R A Q A Y D L V L N G L E L G G G S
- - - - - - - - - A Y D L V L - - - E L G G G S
---------------------------GCATATGATCTAGTCCTT---------GAGTTAGGGGGAGGATCT
505506507508509510511512513514515516517518519520521522523524525526527528
L R I H N S E L Q K Q V L Q T I G L S A E E A Q
L R - - - - - - - - - - - - - - - - - - - - - -
CTACGT------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R Q F G F L M D A L N M G A P P H G G I A F G L
- - - - - - - - - - - - - - P P H G G I A F G L
------------------------------------------CCACCTCATGGTGGAATAGCATTTGGATTA
553554555556557558559560561562563564565566567568569570571572573574575576
D R L V M L L A G E E S I R D T I A F P K T Q Q
D R L V M L - - - - - - - - - - - - - - - - - -
GATCGTCTGGTAATGCTT------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A R C L M T Q A P S N V S N K Q L E E L Y V A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607
T W N P E K Q
- - - - - - -
---------------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_asp_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_asp_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S A V E M S F E N L N L E V P F I N L N N L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K S Y V D K A I K T R G F V C N I N V F K K T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F L T L R D Q N R T L Q C V L S T T E A A K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N N E S Y I E V E G K I C L V S T K I K S C S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E L E L Q L H T F A I L N A S E S V L P F S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K D V S Y T L E D L K K Y N V S P V S Y H L C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D N R S L Y L R S P Q G Y A I T R I L D A V M F
- - - - - - - - - - - - - - - - - I L D A V M F
---------------------------------------------------ATCAGTAAACATAAATGGTTC
169170171172173174175176177178179180181182183184185186187188189190191192
K F R D F L R S N G F I E V K T P K L I G G A S
K F R D F L R S N G F I E V K T P K L I - - - -
AAACTCGAAATATTGCTTAATAGTTTCTAGCTCCGAAGAATAACTTTCGGATAAAAATAC------------
193194195196197198199200201202203204205206207208209210211212213214215216
E G G A N C F K V D Y F A K T A T L A Q S P Q L
- - - - - - - - - - - - - - - - T L A Q S P Q L
------------------------------------------------TTCCATCTCCAAATCCAAACCTAT
217218219220221222223224225226227228229230231232233234235236237238239240
Y K Q M C I L G G L K R V Y E I G H V Y R A E E
Y K Q - - - - - - - K R V Y E I G H V Y R A - -
AAACTCGCT---------------------TTCTTCAGCTCTGTAAACATGCCCTATTTCATAAAC------
241242243244245246247248249250251252253254255256257258259260261262263264
S N I N R Y L S E F I G L D L E M E I T D N Y I
- - - - - - - S E F I G L D L E M E - - - - Y I
---------------------TTGCTTGTAAAGCTGTGGACTTTGAGCTAAAGT------------AAAATA
265266267268269270271272273274275276277278279280281282283284285286287288
S V I N F I Y D L F K S I F V F L S E S Y S S E
S V I N F I Y D L F K - - - - - - - - - - - - -
GTCAACTTTAAAACAATTAGCACCACCTTCACT---------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E T I K Q Y F E F E P F M F T D N P V I L D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I D C M K L L K D E Y N I D M K L E D D F N N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N E K K L G E I V K K K W N T D I F V I K D Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V C C R P F Y T A V D S K T G F T K S Y D F I I
- - - - - - - - - - - - - - - - - - S Y D F I I
------------------------------------------------------CGAGACCAAACAAATCTT
385386387388389390391392393394395396397398399400401402403404405406407408
R G E E I L S G A E R I N C Y K T L K E N I E R
- - - E I L S G A E R - - - - - - - - - - - - -
---------TTCAATATATGATTCATTATTAAG---------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C G I N I S S L G G Y L E A F K I G A P P H G G
- - - - - - - - - - - - - - - - - - - P P H G G
---------------------------------------------------------ACACACAAATCCTCT
433434435436437438439440441442443444445446447448449450451452453454455456
C G I G L E R L V K A Y F G M K D I R Y F S L F
C G I G L E R L V K A - - - - - - - - - - - - -
TGTTTTAATCGCTTTGTCAACATAACTTTTATT---------------------------------------
457458459460461462463464465
P R D P N R L Y P
- - - - - - - - -
---------------------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_gly_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F E D V V E L A K R R G F F W P S F S I Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G S S G F Y D Y G P L G T L L K D N I I S I W K
- - - - - - - - - - - - - - L K D N I I S I W K
------------------------------------------CTTAAGGATAATATAATAAGTATCTGGAAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K S Y A K E G A I F L D T P V I A P A D V F K A
K S Y A K E G A I F L D T P V I A - - - - - - -
AAATCATACGCTAAGGAAGGGGCAATTTTCTTAGACACGCCGGTTATAGCG---------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S G H L E K F S D I A V K C E K C K T A Y K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N L L K S V G I D V P L N N V E K A N A V L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y D V K C P K C G A P L R G A Y E F N L M F K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G T N E L Y L R P E T A Q G I F I N F K N L Y N
- - - - - Y L R P E T A Q G I F - - - - - - - -
---------------TACCTTAGGCCTGAGACTGCGCAAGGCATATTT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y S R N T M P I I V C Q V G K G F R N E I S P R
- - - - - - - I I V C Q V G K G F R N - - - - -
---------------------ATAATAGTCTGCCAAGTCGGGAAAGGTTTCAGGAAT---------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q A L I R M R E F T Q A E V E V F Y L N D S D F
- - - - - - R E F T Q A E V E V F - - - - - - -
------------------AGGGAATTCACCCAGGCTGAAGTCGAGGTATTT---------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N P N G N S L K F K L L R N T G E E V T V D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E A L H S G I V K N P V M A Y F L E K T Y S I L
- - - - - - - - - - - - M A Y F L E K T Y S I L
------------------------------------ATGGCCTATTTCCTCGAGAAGACATACAGCATACTC
265266267268269270271272273274275276277278279280281282283284285286287288
S S I G F N P N H L R A R E H D P L E R A H Y S
S - - - - - - - - - - - - - - - - - - - - - - -
TCT---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S E T W D F E Y L M D G E W I E I V G V S D R G
- - T W D F E Y - - - - - - - E I V G V S D R -
------ACTTGGGACTTCGAATAC---------------------GAGATAGTCGGGGTCTCTGATCGT---
313314315316317318319320321322323324325326327328329330331332333334335336
T Y D L G R H Q Q F S G E N M E V D G N I P R V
- - - - - - - - - - - - - - - - - - - - - P R V
---------------------------------------------------------------CCAAGGGTA
337338339340341342343344345346347348349350351352353354355356357358359360
V E P S Y G I D R I V L T I L N D G Y Y I R D N
V E P S Y G I D R I V L T - - - - - - - - - - -
GTAGAGCCCTCCTATGGGATAGATAGGATAGTCCTTACT---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G Y K V L K L D P A V S P L H F A V F P L Q R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D G L D A K A K E L F N K I K Q I D P F V Y Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E G G N I G R R Y A R Q D E I G T P F C I T V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y E T L E D S T V T I R E R D S T K Q V R E N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476
E E L L Q K I S D Y P E Y P T S L F K N
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_gly_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F D D V I E L A K R R G F F W P S Y M I Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G S S G F Y D Y G P L G T L L K D N I I A A W K
- - - - - - - - - - - - - - L K D N I I A A W K
------------------------------------------TTCATCATCCTTTGTCTGGTAATCAACCGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R E Y A R E G A I F L D T P V I S P A D V F R A
R E Y A R E G A I F L D T P V I . . . D - - - -
CACGCAGAAAGGAGTACCTATTTCGTCCTGTCTTGCGTATCTCCTGCC---------ACT------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S G H L E K F S D I A V K C S K C G T P Y K F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S L I K S L G I N E I A K T V D E A A A I L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y D V K C P K C G E K L K N P Y D F N L M F R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G S N D L Y L R P E T A Q G I F I N F K N L Y N
- - - - - Y L R P E T A Q G I . . . . . . . . .
---------------CTGAAAGTTTTCTCCGGAAAACTGCTGATG---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y A R N S M P I I V C Q V G K G F R N E I S P R
. . . . . . P I I V C Q V G K G F R N - - - - -
------------------GGTCCAATCACCATCAAGGAGATATTCAAAATCCCATGT---------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q A L I R M R E F S Q A E V E V F Y I E N D D F
- - - - - - R E F S Q A E V E V F - - - - - - -
------------------ATGCTCCCTTGCCCTTATGTGATCCGGTTGGAA---------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P I P D S S V E L N M L R N T G D L L K M K V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D A L R S G I I G N R V M A Y F L N K T Y E I L
- - - - - - - - - - - - M A Y F L N K T Y E I L
------------------------------------AAGTTCAACGCTAGAATCAGGGATGGGGAAGTCATC
265266267268269270271272273274275276277278279280281282283284285286287288
L K L G F Q P D H I R A R E H D P G E R A H Y S
L - - - - - - - - - - - - - - - - - - - - - - -
GTT---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S E T W D F E Y L L D G D W T E I V G V S D R G
- - T W D F E Y - - - - - - - E I V G V S D R -
------GTTTCTGAACCCCTTACC---------------------CATTGAGTTTCTGGCGTAATTATA---
313314315316317318319320321322323324325326327328329330331332333334335336
T Y D L G R H Q Q F S G E N F Q I D G R T P K V
- - - - - - - - - - - - - - - - - - - - - P K V
---------------------------------------------------------------GACACGGAA
337338339340341342343344345346347348349350351352353354355356357358359360
V E P S Y G L D R I L L T I M D S S Y Y R R E N
V E P S Y G L D R I L L T - - - - - - - - - - -
CATAAGGTTGAAATCATATGGATTCTTCAGCTTTTCCCC---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G Y K V L R L D P H I S P I H M A I F P L Q K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D D L D K I A K D L F E K M K N I D P F I F Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D S G N I G R R Y A R Q D E I G T P F C V T V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y Q T K D D E T V T I R E R D S T S Q V R V K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476
S D L L E R T R S F P D S L S A L F S N
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_gly_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L K E Y V L K G F F Y P A S E I Y N S I A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F Y D Y G Y L G T L L K N N F I N E W K N Y F L
- - - - - - - - - - L K N N F I N E W K N Y F L
------------------------------AGTTTGGTAATCTATTGTTATTGCATAAGGTACCCCAATTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L H P N F W E V D P A I V M P K E V F I A S G
R . . P N F W E V D P A I V M - - - - - - - - -
GTC------TCTGTACCTTCTCCCTATAGAGCCTTGTTCATCATA---------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L E N F N D P I V E C K N G H R F R A D H L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E K L N I K A E G L S L S E M E E L L K N V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
C P I C N A P L G K V K W F N L M F P I Y I G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D S Q E A L N L L K N L K E N V S E Q Y I K D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I E R V K K M V E N E A Y L R P E T A Q G P Y V
- - - - - - - - - - - - Y L R P E T A Q G P Y -
------------------------------------TTCTTTCCATCCATAGGTTGGGAAATTTATTTC---
193194195196197198199200201202203204205206207208209210211212213214215216
M F K R E F I L H R Q K L P L G L A V V G K A F
- - - - - - - - - - - - - - L G L A V V G K A F
------------------------------------------TAACTCTCTAAACCTAAGCCTTTCTTCGGG
217218219220221222223224225226227228229230231232233234235236237238239240
R N E I S P R Q L L L R L R E F T Q A E L Q I F
R N - - - - - - - - - - - R E F T Q A E L Q I F
GATTCC---------------------------------AAAATAAGCATAAAACTCTGGGAATGGCAAATC
241242243244245246247248249250251252253254255256257258259260261262263264
F D P E D N E F D I N E V K D V E L N F L D K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G N Y K R I K V K D L P F P E F Y A Y F V G K V
- - - - - - - - - - - - - - - - Y A Y F V G K V
------------------------------------------------TGTGAACTCTCTCAATCTTAATAA
289290291292293294295296297298299300301302303304305306307308309310311312
K Q F Y E R L G I P E E R L R F R E L S E K E K
K Q F Y E - - - - - - - - - - - - - - - - - - -
TAATTGCCTAGGACT---------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A F Y N K Y H V D I E I N F P T Y G W K E V G G
- - - - - - H V D I E I - - - - - - - - E V G G
------------------TTTAAACATAACATATGG------------------------ATAAGCTTCATT
337338339340341342343344345346347348349350351352353354355356357358359360
I H Y R T D H D L S G H M K V S G K D L T V Q K
I H Y R - - - - - - - - - - - - - - - - - - - -
TTCAACCATTTT------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D N K K F I P H V L E L S F G V D R N V L A L I
- - - - - - P H V L E L S F G V D R N V L A - -
------------------TTGGGAATCGGGCCCAATATAAATGGGAAACATCAAATTGAACCATTT------
385386387388389390391392393394395396397398399400401402403404405406407408
D L F L T E E E Y E I E R D N Q K V K E K R V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L K I P K H L A P I K V A V F P L L K K P E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E K A K E V Y N M L K N Y F Y P I I Y D E Q G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I G R R Y R R V D E I G V P Y A I T I D Y Q T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E D N T V T I R D R D T M K Q V R V K I E D L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512
N Q L T L S S S
- - - - - - - -
------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_gly_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E D V Y E R I M E I A R R R G F I L P A F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y G G A R G F Y D Y G P L G A L L K R K I E E
- - - - - - - - - - - - - - - - - L K R K I E E
---------------------------------------------------CGTGTCGTCCTCGAGAGTTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K W R E Y Y V H K E G F M E I E A P N L L I G E
K W R E Y Y V H . E G F M E I E A P N L L - - -
GTGGTCTACGGTGACGCAGTACGG---ACCGATCTCGTCGGCGCGAGCGTATCGTCTGCCTAT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V F E A S G H V E H F I D P M T H C S E C G E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F R A D H L A E E E L G V D A E G M S P E E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D L I R E H D L R C P E C G G E L A E V T E F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L M F D T N I G P K E G R T G Y L R P E T A Q A
- - - - - - - - - - - - - - - Y L R P E T A Q A
---------------------------------------------GCACTCCGGTGGCACCTCTACCTCCTT
169170171172173174175176177178179180181182183184185186187188189190191192
I F I Q F K D L Y R W A R Q K L P F G V V Q I G
I F - - - - - - - - - - - - - - - F G V V Q I G
GCCGTC---------------------------------------------GGTGATCCGACGTAGCGCCTC
193194195196197198199200201202203204205206207208209210211212213214215216
R A Y R N E I S P R Q G V I R L R E F T Q A E A
R A Y R N - - - - - - - - - - - R E F T Q A E A
CGCGATCTTCGGGGC---------------------------------CACGGGTTCCGGGCGGTAGACTAT
217218219220221222223224225226227228229230231232233234235236237238239240
E V F F D P E E K E Y P G F E R Y A D E V L K F
E V F - - - - - - - - - - - - - - - - - - - - -
CTTGGGCTC---------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y P I E E Q R K E N G E M L E M S V R E A V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G M V S Q P I G Y F L G L T K R M L N E M G V P
- - - - - - I G Y F L G L T K R M L N - - - - -
------------------CCGCTCTTCGGGAAGGTGCTGACGCGATCGGATGGCTTC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
N E A I R S R Q H L P E E R A H Y A S D C W D V
- - - - - - - - - - - - - - - - - - - - C W D V
------------------------------------------------------------CTCCTCGACTGC
313314315316317318319320321322323324325326327328329330331332333334335336
E V K L E R F G W V E V V G I A D R T D Y D L K
E V - - - - - - - - E V V G I A D R - - - - - -
CTCACG------------------------GTTCTCCTTCCGCTGTTCCTCTAT------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K H S E H S G E D L R A F R E L E E P K I V Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P E P V M K E L G P R F K S D A P K I A E A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I T A E S E D E L K G G L T V E V D G K E V E
- - - - - S . . . . . . . . . . . . . . . . . .
---------------CTT------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V P P E C Y E I V K E K V T G E R F Y P H V I E
. . . . . . . . . . . . . . . . . . . . H V I E
------------------------------------------------------------GTTGAACTCAGT
433434435436437438439440441442443444445446447448449450451452453454455456
P S Y G I D R I L Y C V L E H N F D P E E G V F
P S Y G I D R I L Y C - - - - - - - - - - - - -
AACCTCAGCGAGCTCCCCACCGCACTCGGGACA---------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F P A W L A P I E V G V F P L L K R S D M V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y A R R V A R M L R E E G F T V E Y D D S G S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G R R Y A R A D E I G V P Y C V T V D H E T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D D T V T I R D R D T T E Q V R V E V D E L A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571
V L R G L I D G D L E F E E A G D P V
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_gly_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N H E R T M T V A R K R G F L W S S F E I Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G V A G F V D Y G P L G A T L K N K I M N R W R
- - - - - - - - - - - - - - L K N K I M N R W R
------------------------------------------CACCGTAACTGCAAATGGGACACCTATCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E F Y V V R E G F Y E I E S P T I M P E E A L K
E F Y V V . E G F Y E I E S P T I M - - - - - -
ATCTGCACGGGCATA---TCTTCCTATTGTTCCTGATGAATCAAATTCTGCAAT------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A S G H V D H F N D P M T Q C K E C M D V Y R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D H I I E D A T G R D V E G L E N Q E L T E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S D E G I R C P R C G G H L T H V W S Y N L M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q T L I G A R G K K T G Y L R P E T A Q G I F I
- - - - - - - - - - - - Y L R P E T A Q G I F -
------------------------------------CTCGAATTCACCCTCAAGGATGAACCTTCCCTC---
169170171172173174175176177178179180181182183184185186187188189190191192
P F K R L L R F F R N R L P F G V V Q L G K S Y
- - - - - - - - - - - - - - F G V V Q L G K S Y
------------------------------------------GGCACTGGCTATCCTGGCGGCATCCTTACG
193194195196197198199200201202203204205206207208209210211212213214215216
R N E I S P R Q G V I R L R E F T Q A E A E I F
R N - - - - - - - - - - - R E F T Q A E A E I F
GAATTT---------------------------------ACGTTTCCTAATCCTCCTTGGCTCATCATATTC
217218219220221222223224225226227228229230231232233234235236237238239240
V D P E H K T H P D F E E V K E D I L R L Y P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G R Q M E E S G T V D M T A A E A L E A G V I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S E V L T Y H L C L A K R F L M D I G I P E D A
- - - L T Y H L C L A K R F L M - - - - - - - -
---------TGGAAGGTGCTGCCTGAACCTCAGGGCATCCTCGGGGAT------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L R F R Q H L P S E M A H Y A I D C W D V E A F
- - - - - - - - - - - - - - - - - C W D V E A -
---------------------------------------------------AAGGGCCTCAGCGGCCGT---
313314315316317318319320321322323324325326327328329330331332333334335336
T D S Y G W I E I I G I A D R T D Y D L R S H S
- - - - - - - E I I G I A D R - - - - - - - - -
---------------------CATCTGTCTCCCGGCAGGGTACAG---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q H S G E D L R V F I E Y D E P R R I R K R A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K P D M G K L G P K F R K D A A R I A S A L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V D V E E I E K A L D E E G R F I L E G E F E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L P D D V S F E D V E E V V T G R K V Y P H V I
- - - - - - - - - - - - - - - - - - - - P H V I
------------------------------------------------------------GGTTAAGTGGCC
433434435436437438439440441442443444445446447448449450451452453454455456
E P S F G I D R I I Y T L L L H S L V D D G E R
E P S F G I D R I I Y T - - - - - - - - - - - -
TCCACACCTGGGACACCTTATCCCCTCATCTGATAT------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T Y F R L P P H V A P V E V T V L P L V N R E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
M V M T A L E I E R N L R R S G F I A E F D S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G T I G R R Y A R A D E I G V P F A V T V D H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T L E D G T V T L R N R D D C S Q V R V K I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562
L V P T L E K L R G
- - - - - - - - - -
------------------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_gly_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R R A E T L E E I V K R R L L Y W P S S E I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G G V G G F Y D Y G P L G V Q L R R N I V E K W
- - - - - - - - - - - - - - - L R R N I V E K W
---------------------------------------------CTAAGGCGTAATATAGTGGAGAAGTGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R K V F V L P Y Q D L I I E V E T P I I M P E P
R K V F V L . . . D L I I E V E T P I I M - - -
CGTAAGGTGTTTGTACTC---------GATCTCATAATTGAAGTGGAGACGCCTATTATCATG---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V F K A S G H L D H F T D Y L V T C T K C G R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y R A D H L V E E E L A K R G L K I S T E G M S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A S D L E R L I S E H K I V C P H C G G P L G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V E T F N L L F K T T I G P Y S E N A G Y L R P
- - - - - - - - - - - - - - - - - - - - Y L R P
------------------------------------------------------------TATTTGAGGCCG
169170171172173174175176177178179180181182183184185186187188189190191192
E T A Q G M F V A F P R L A E Y V G R R H P F G
E T A Q G M F - - - - - - - - - - - - - - - F G
GAGACCGCCCAGGGTATGTTC---------------------------------------------TTCGGC
193194195196197198199200201202203204205206207208209210211212213214215216
V A Q I G R V A R N E I S P R G G L M R L R E F
V A Q I G R V A R N - - - - - - - - - - - R E F
GTGGCGCAGATTGGCCGGGTTGCGCGTAAT---------------------------------AGAGAGTTT
217218219220221222223224225226227228229230231232233234235236237238239240
T Q M E I E L F F D P Q N P K C P Y F A E V E S
T Q M E I E L F - - - - - - - - - - - - - - - -
ACGCAAATGGAGATAGAGCTGTTT------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F E I P I V P E E F V A K G Q T E P V Y L T A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V V E R G H A N E W M A F F M A L A A K F L K
- - - - - - - - - - - M A F F M A L A A K F L K
---------------------------------ATGGCGTTTTTCATGGCGTTAGCCGCGAAGTTTTTAAAA
289290291292293294295296297298299300301302303304305306307308309310311312
E L G V P I E R Q K F L G K L P H E R A H Y S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K S Y D Q M V L T E R F G W V E V S G H A Y R T
- S Y D Q M V - - - - - - - - E V S G H A Y R -
---TCTTACGACCAAATGGTG------------------------GAGGTTTCCGGCCACGCCTACCGC---
337338339340341342343344345346347348349350351352353354355356357358359360
D Y D L S G H S K F S S R E M Y L E R R L S T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K E V E V V R L Y P N P N A I R E R Y G D K I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E V I K A I K E H E G R V I E A F N R G M S E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L G E Y V I S R D M V Y I K L E K R K T D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K F I P H V V E P S F G L D R I M Y V V L E S A
- - - P H V V E P S F G L D R I M Y V - - - - -
---------CCGCACGTGGTGGAGCCCTCCTTCGGGCTTGACAGAATTATGTATGTA---------------
457458459460461462463464465466467468469470471472473474475476477478479480
V V E E E G R V Y L R L P P D I A P V K A C I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P I V K R A D Y V E I G R T L W R S L A R Q G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V V L Y E D E G T I G S R Y A S C D E I G T P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A V T I D E K T P V D G T V T I R D R D T K R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V R V K L G D V V T F V S M V A G G A S F D D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586
A R A L G A A P V Q
- - - - - - - - - -
------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_gly_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G S R S I A S E D R Y E Q V M E L A K R R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F W P S Y E I Y G G V A G F Y D L G P L G A R L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K D K I I A L W R H Y F I R R H S H I V V E I E
K D K I I A L W R H Y F I R . . . H I V V E I E
GTAGTCCACGGTGATAGCTGCGGGCACGCCGATCTCATCTAC---------CCTTCGACCTATACTACCGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T P V I A P A R V F E A S G H L E H F T D P I V
T P V I A - - - - - - - - - - - - - - - - - - -
GTCATCATATATAGC---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E C L N C R R K F R A D H L I E E R L D I K A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G L S L E E M T R I I R E H N I R C P V C G G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L G E V R S F N L L F K T T I G P Y S E N V G Y
- - - - - - - - - - - - - - - - - - - - - - - Y
---------------------------------------------------------------------TAT
169170171172173174175176177178179180181182183184185186187188189190191192
L R P E T A Q G M F V A F K R V H E V T R Q R L
L R P E T A Q G M F - - - - - - - - - - - - - -
CTTTACACCGGCTACCTCTATGAAGCCTTT------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P L G I A Q I G R V A R N E I S P R Q G M I R L
- L G I A Q I G R V A R N - - - - - - - - - - -
---AGCCTCTAGTATCTCTCTAGCTCGCTGGCGGAATGT---------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R E F T I A E M E F F F D P E D P W H G G I L E
R E F T I A E M E F F - - - - - - - - - - - - -
CCGCTTCTTTACCACCTTGGGCTCCTTGAACTG---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E L L D R V S H R K L R I L R T D A K A K G I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K P E E Y G V R E A I E E G I I V T P W L A Y W
- - - - - - - - - - - - - - - - - - - - L A Y W
------------------------------------------------------------GTACATATTCTC
289290291292293294295296297298299300301302303304305306307308309310311312
M A V A R D F I M E L G V P Y E N M Y F E E K A
M A V A R D F I M - - - - - - - - - - - - - - -
GTAGGGTACACCGAGCTCCATTATGAA---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P E E R A H Y A A Q T F D Q L V K V S R L G W V
- - - - - - - - - - T F D Q L V - - - - - - - -
------------------------------GTATTCTTCGGGCTTGTC------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E V S G H A Y R T D Y D L S R H M K Y S G Q D L
E V S G H A Y R - - - - - - - - - - - - - - - -
ACGGAGTATGCGTAGCTTCCGGTG------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R V F K Q F K E P K V V K K R V V I I D R A W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G R T F R Q R A R E I L E A A Q N L D P D E V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I L R D K G F I E V A G V K I P A E H V K I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E K V E K V T G K R F I P H V A E P S F G V E R
- - - - - - - - - - - - P H V A E P S F G V E R
------------------------------------CTCGCCCAGGGGGCCACCGCATACTGGGCAACGTAT
457458459460461462463464465466467468469470471472473474475476477478479480
L L F V T L D Y A Y S E K D G R V V L R I P R R
L L F V - - - - - - - - - - - - - - - - - - - -
ATTGTGTTCGCG------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I A P I E A A V F P I V R D E K L V E I A R S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
W W R I L E N G M Y A I Y D D D G S I G R R Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R V D E I G V P A A I T V D Y Q T L E D N T V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L R D R D T W K Q V R I P V D S V V D A L R R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590
I E G A D I T E L G K P I E
- - - - - - - - - - - - - -
------------------------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_gly_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N G K F D K Y E Y L Q D L M R R R G F A W G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F E I Y G G S R G F Y D Y G P L G A T I K R K I
- - - - - - - - - - - - - - - - - - - I K R K I
---------------------------------------------------------GTAAGGTGTTCCAAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E R K I R E A F I R E G F F E I E T P D I T P E
E R K I R E A F I R E G F F E I E T P D I T - -
TTCATCGTAGCGCATGTACCTCTTTCCTATGCTGTCCTTTTCATCGTAAACTACTATGAATCCCTC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q V F I A S G H V E K F V D P V V E C K K C G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R F R A D H L I E E F L G I D V E G K S A E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S R I I R E H G L K C P E C G G E L S D V F Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N L M F E T Y I G P Y K D K K A Y L R P E T A Q
- - - - - - - - - - - - - - - - Y L R P E T A Q
------------------------------------------------ACCTTCAATCGTGACCTTTCCTTT
169170171172173174175176177178179180181182183184185186187188189190191192
G I F V N F K R L N A F A R N K L P F G V F Q I
G I F - - - - - - - - - - - - - - - F G V F Q I
CTCATTAAG---------------------------------------------AATTTCATTTATTTTCTT
193194195196197198199200201202203204205206207208209210211212213214215216
G K A Y R N E I S P R Q G M I R L R E F T Q A E
G K A Y R N - - - - - - - - - - - R E F T Q A E
TGCATCCGCCTTGAGCTT---------------------------------AATTCTCTTAACGACCTTCGG
217218219220221222223224225226227228229230231232233234235236237238239240
A E I F F N P N E T E H P H F N E V K H E K L K
A E I F - - - - - - - - - - - - - - - - - - - -
TTTGTCATAATG------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L Y P I E N Q L K E L G E V E V T A E E A V K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G Y V M N S F F A Y Y M V M I K K I L L D I G I
- - - - - - - F A Y Y M V M I K K I L L - - - -
---------------------GGGTAATTGTTGCCTGAATCGTATCTTATCCTCTGGAAT------------
289290291292293294295296297298299300301302303304305306307308309310311312
P E D K I R F R Q Q L P E E R A H Y S A D T W D
- - - - - - - - - - - - - - - - - - - - - T W D
---------------------------------------------------------------CACTGCTTC
313314315316317318319320321322323324325326327328329330331332333334335336
A E V Y S E R F G W V E C V G L A Y R T D Y D L
A E V - - - - - - - - E C V G L A Y R - - - - -
TTCAGCTGT------------------------AAGCTGGTTTTCTATTGGGTATAG---------------
337338339340341342343344345346347348349350351352353354355356357358359360
S R H M K M S G A D L T V M I H Y D K P K V V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R I Q V S L N M K K V G P K L K A D A K K I N E
- - - - - - - - - - V . . . . . . . . . . . . .
------------------------------AGA---------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I I K S M D Q K E L E K L V K D L N E K G K V T
. . . . M . . . . . . . . . . . . . . . . . . .
------------ATT---------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I E G Y E L S K E D F I V K E V E E K I T G E K
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I V P H V L E P S F G I D R P F Y L L L E N S L
I . . H . . E P S F G I D R P F Y L - - - - - -
GCT------CCC------TTCGGGGCACTTCAAACCATGTTCCCTAATTATCCT------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T V D E D G R I Y L K I K K D M A P I E V A V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P L V A K E P L T T I A Y E I Y R T L Q K E G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I V V Y D E K D S I G K R Y M R Y D E I G T P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
C V T V D N Q T P E D G T V T I R D R D T R E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570
I R V K I E E L P R K L K E L I F G
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_gly_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A S N T I A K D R Y D R V I E L A K R R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F W P S Y E I Y G G V A G F Y D L G P L G V R L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CTG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K E K I V A L W R D Y F I R R H N H I V V E I E
K E K I V A L W R D Y F I R . . . H I V V E I E
GTAGTCTACGGTTATCGCGGCCGGCACTCCTATCTCGTCTAC---------CCTGCGGCCTATGCTTCCATC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T P V I A P A K V F E A S G H L E H F T D P I V
T P V I A - - - - - - - - - - - - - - - - - - -
ATCATCGTATATCGC---------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E C L R C R R K F R A D H L I E E K T G I R A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G L T L E E M T R I I R E H D I R C P V C G G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L S E V R A F N L L F K T T I G P Y S E S V G Y
- - - - - - - - - - - - - - - - - - - - - - - Y
---------------------------------------------------------------------TAT
169170171172173174175176177178179180181182183184185186187188189190191192
L R P E T A Q G M F V S F K R V F E V S R Q R L
L R P E T A Q G M F - - - - - - - - - - - - - -
TTTCTCGCCGGCCACCTCTATGTAGCCTTT------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P L G I A Q V G R V A R N E I S P R Q G I M R L
- L G I A Q V G R V A R N - - - - - - - - - - -
---TGCCTCTAGTATCTCGCGGGCACGCTTCCGGAAGGT---------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R E F T I A E M E F F F D P E D P W H G G V L E
R E F T I A E M E F F - - - - - - - - - - - - -
CTTCTTTCTGACTATCTTGGGCTCCTGGTACTG---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E L L G S V E H R K L R I L R A E A K A Q G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K P E E Y G V R E A I E E G V V R T P W L A Y W
- - - - - - - - - - - - - - - - - - - - L A Y W
------------------------------------------------------------GTACATGTCCCC
289290291292293294295296297298299300301302303304305306307308309310311312
M A I A R D F V M E L G V P Y G D M Y F E E K A
M A I A R D F V M - - - - - - - - - - - - - - -
GTAGGGTACGCCCAACTCCATGACGAA---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P E E R A H Y A A Q T F D Q L V R V S R L G W V
- - - - - - - - - - T F D Q L V - - - - - - - -
------------------------------GTACTCCTCGGGCTTCTC------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E V S G H A Y R T D Y D L R R H M Q Y S G H D L
E V S G H A Y R - - - - - - - - - - - - - - - -
GCGGAGTATGCGTAGCTTACGGTG------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R V F K Q Y Q E P K I V R K K M V L L D R A W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G R T F R K R A R E I L E A A R S L D P E T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K E L R E K G Y I E V A G E K I P A E H I K I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E K E E K V T G K R F L P H V A E P S F G V E R
- - - - - - - - - - - - P H V A E P S F G V E R
------------------------------------CTCGCTGAGGGGGCCGCCGCACACGGGGCACCTTAT
457458459460461462463464465466467468469470471472473474475476477478479480
L I F V A L D H A Y S E R G E R V V L R L P R R
L I F V - - - - - - - - - - - - - - - - - - - -
ATCGTGCTCCCG------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I A P I E A A V F P I V R E E S L V R I A R D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
W R K L L E N G M Y A I Y D D D G S I G R R Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R V D E I G V P A A I T V D Y Q T L E D N T V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L R D R D T W K Q V R V P V N R I A E A V K K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590
I E G A S L E E I G T P T S
- - - - - - - - - - - - - -
------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_gly_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q D R L E K I V S L C K R R G F I F P S S E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y G G L A A V Y D Y G P L G V E L K R N V Q Q R
- - - - - - - - - - - - - - - - L K R N V Q Q R
------------------------------------------------TTCGAGCGTCTGGCTGTCGATCGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W W E A M V Y E H E N I V G L D A A I L M H P M
W W E A M V Y E . . N I V G L D A A I L M - - -
GACGCAGAAGGGCGTGCCCACCTC------GCGCCGATAGCGCCGGCCGATGGCACCTTTCTC---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V W K A S G H V D A F N D P L I D D R Q S K R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y R A D Q L I E D Y I E K L R A K G E T E R A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A L H R R L I E A L N A E D M P K A L Y Q I I M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D E R I P S P D S G A F D W T E V R Q F N L M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V T H V G P V A S E E T K V Y L R P E T A Q G I
- - - - - - - - - - - - - - Y L R P E T A Q G I
------------------------------------------CTGCCAGCCCATCGGGAACAGGTACTGAAT
193194195196197198199200201202203204205206207208209210211212213214215216
F V N F H N V K D S S R L Q I P F G I A Q I G K
F - - - - - - - - - - - - - - - F G I A Q I G K
ATC---------------------------------------------GCGCAGGTGATCCGGCCGGATACC
217218219220221222223224225226227228229230231232233234235236237238239240
A F R N E I V A R Q F I F R M R E F E Q M E M Q
A F R N - - - - - - - - - - - R E F E Q M E M Q
GTTTTCGATGTG---------------------------------CGCCTCCATCTGCGTGCCCGGCTTTAC
241242243244245246247248249250251252253254255256257258259260261262263264
Y F V K P G T Q M E A F E A W K E K R L Q W H I
Y F - - - - - - - - - F E A W K E K R L Q W H I
GAAGTA---------------------------CATCCGGAAGATGAACTGCCGGGCCACGATCTCATTGCG
265266267268269270271272273274275276277278279280281282283284285286287288
E N G I R P D H L R F H V H E K L A H Y A D A A
- - - - - - - - - - - - - - - - - - - - - - - A
---------------------------------------------------------------------GTT
289290291292293294295296297298299300301302303304305306307308309310311312
V D I Q Y L F P M G W Q E V E G I H S R T D Y D
V D I Q Y - - - - - - - E V E G I H S R - - - -
GACAAAAATGCCCTG---------------------GACCTTCGTTTCTTCGGAGGCCAC------------
313314315316317318319320321322323324325326327328329330331332333334335336
L R R H Q E F S G K K M E Y F D P Q T Q E R Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P Y V V E T S A G L D R T I L M L L C E A Y D E
P Y V V E T S A G L D R T I L M - - - - - - - -
CTCGTCCATGATGATCTGGTAGAGCGCCTTCGGCATGTCCTCGGCGTT------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E E V E G E T R V V L R L H P R L A P I K V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L P L V R K D G M P E R A Q A L V R D L R P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N T F Y D E K G A I G R R Y R R M D E V G T P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C V T I D S Q T L E D G T V T V R D R D T M Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E R I P E T Q V L A Y I K D R L R H W K P V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481
T
-
---
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_gly_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P D L Q T K V I E L A R R R G I F W P S Y E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y G G V A G L Y D I G P I G V R I K N K I V D L
- - - - - - - - - - - - - - - - I K N K I V D L
------------------------------------------------TCTTATTGTTACAGTATTATCAGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W R K H F I K D N S D F V V E I D T P A L T P Y
W R K H F I K D . . . F V V E I D T P A L T - -
CAATGTCATAGGATCTACGGTAAT---------CACACCGATTTCATCAACTCTGGCGTATCTTTT------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K V L E A S G H V D N F T D P V V E C N S C H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V Y R A D H L V E E I A K V T T E G L P P S E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D K I I R E K G I K C P K C G G E L G E V R L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N L L F E T R I G P Y S T N K A F L R P E T A Q
- - - - - - - - - - - - - - - - F L R P E T A Q
------------------------------------------------TTCAACTATTTTCACATACATATC
169170171172173174175176177178179180181182183184185186187188189190191192
G M F T S F K R V Y E A F R Q K L P I G I A Q I
G M F - - - - - - - - - - - - - - - I G I A Q I
TATGTCTTT---------------------------------------------AACGGTTTTAGTATTTAT
193194195196197198199200201202203204205206207208209210211212213214215216
G K V G R N E I S P R Q G L I R M R E F T I M E
G K V G R N - - - - - - - - - - - R E F T I M E
TATTTCCATGATTGTTTT---------------------------------CTTGTTTAATATTAATGTTTT
217218219220221222223224225226227228229230231232233234235236237238239240
V E F F F D P T S D V E P P L D R L Y D L E I N
V E F F - - - - - - - - - - - - - - - - - - - -
CTTCTTAACAAT------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I L R G D D K A R G E E K Y T K Y K F S E I V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E K I V I N K W M A Y W M G V A S N F V N S L G
- - - - - - - - M A Y W M G V A S N F V N - - -
------------------------TGCTCTTTCATGTGGTAGCTTTTCCTCAAAGTAAAATGA---------
289290291292293294295296297298299300301302303304305306307308309310311312
I S S F Y F E E K L P H E R A H Y S K Q T F D Q
- - - - - - - - - - - - - - - - - - - - T F D Q
------------------------------------------------------------TATTTTCTCATT
313314315316317318319320321322323324325326327328329330331332333334335336
I V V I D N V K V E I S G H A Y R S D Y D L S R
I V - - - - - - - E I S G H A Y R - - - - - - -
AACTAT---------------------ATATTTTTCTTCGCCTCTTGCTTT---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H S T Y S G Q D L S I F K K F D T P K I V K K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T L I L N K D L V T K E G R D F N K T I M E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N T K T V E E I E R M I L N K E K V L G K D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M Y V K I V E R E E K I S G E R V I P H V I E P
- - - - - - - - - - - - - - - - - - P H V I E P
------------------------------------------------------TTCAAATAATAGGTTGAA
433434435436437438439440441442443444445446447448449450451452453454455456
S F G V E R C L Y L T L L N S Y M E K D G R I I
S F G V E R C L Y L - - - - - - - - - - - - - -
TAGTCTAACTTCTCCAAGCTCGCCACCACA------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L S L P K R L S P Y D I A I F P L L E K D E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K K A R E I Y D S L K E K Y D I I F D D S G S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G K R Y A R V D E I G V P Y S I T V D P M T L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D N T V T I R D R D S W Q Q I R V N I T D L M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574
V L D R L F K G E D F N K L G K V V S N N E
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_gly_aa
Archaea/Staphylothermus marinus/Smarinus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V N K Q V D K Y Q I L L D L G K R R G L F W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S Y E I Y G G V A G F Y D F G P N G V L I K R N
- - - - - - - - - - - - - - - - - - - - I K R N
------------------------------------------------------------TTGGTAATCAAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I I N E W L N N L V Y N T G L V L E I E T P I I
I I N E W L N N L V Y . . G L V L E I E T P I I
TGTTATAGCATATGGTATACCTATTTCATCGGC------GTATCTTCGACCAATGCTTCCTTCTTCATCATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T P R I V L K A S G H E D H F T D P I T E C T R
T - - - - - - - - - - - - - - - - - - - - - - -
GTA---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C G R V F R A D H L I E E A L G I R A E G L S M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D E L W K L I K E H N I R C P E C G G E L T K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K P A L L L F K T E I G P Y K G S P A Y L R P E
- - - - - - - - - - - - - - - - - - - Y L R P E
---------------------------------------------------------TATTATGAAGCATTC
169170171172173174175176177178179180181182183184185186187188189190191192
T A Q G M F V S F K H V L N I A R N K L P L G I
T A Q G M F - - - - - - - - - - - - - - - L G I
GCGACTAAGTTTATAATT---------------------------------------------TTCAGCAGG
193194195196197198199200201202203204205206207208209210211212213214215216
A Q I G R V G R N E I S P R Q G L L R L R E F T
A Q I G R V G R N - - - - - - - - - - - R E F T
TATTTCATTGAGTTTTTTCATAACAGT---------------------------------CTTGGGGTTAGG
217218219220221222223224225226227228229230231232233234235236237238239240
I M E L E F F F D P E K A F E E T M K Y M T D E
I M E L E F F - - - - - - - - - - - - - - - - -
AACAATCTTAACAATTTTTTT---------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I R N E K L N I I T A E D K L R G E E K T R K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T A I E L I E N K I V K N P W M A Y W M A L G N
- - - - - - - - - - - - - - - M A Y W M A L G N
---------------------------------------------TTCCTCGGGAAGTTTCTCGTCGAAACG
289290291292293294295296297298299300301302303304305306307308309310311312
I F L R K L G I S S E K I R F D E K L P E E K A
I F L R - - - - - - - - - - - - - - - - - - - -
TATTTTTTCAGA------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Y S E Q T F D Q E V Y T E K Y G W I E V A G Y
- - - - - T F D Q E V - - - - - - - - E V A G Y
---------------ATTCTCAATTAATTCAAT------------------------TTCTCCTCTCAACTT
337338339340341342343344345346347348349350351352353354355356357358359360
S Y R T T Y D L S R H I K Y S K A D L T Y F K K
S Y R - - - - - - - - - - - - - - - - - - - - -
GTCCTCAGC---------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y D K P I K K K I V K I V P N P K K I R E I V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K D I G T V M K K L N E I P A E K I L E E L N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N N Y V E I S N Y K L S R E C F I I S E K E E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I H G E K I I P H V V E P S F G L E R I F Y V V
- - - - - - - P H V V E P S F G L E R I F Y V -
---------------------CAATAAAAGTGCTGGTTTAGGCTTTGTTAATTCTCCTCCACATTCTGG---
457458459460461462463464465466467468469470471472473474475476477478479480
L E N S I S I A R D G R I V L K L P P R I A P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K V A V F P L V T G N K P E H K K M V S I A R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V Y R A L L E N N I L A Y Y D E E G S I G R R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A R A D E I G I P Y A I T I D Y Q T L E D E T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
T L R D R D S R E Q I R L H I Q E L H D K L I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588
L L G L K K E F N I E F
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/gly_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E I M E M L I R R G F L W Q S F E I Y G G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G F I D Y A P L G N N L R R K I E N I W R K Y
- - - - - - - - - - - - L R R K I E N I W R K Y
------------------------------------CTCAGAAGGAAGATTGAGAACATCTGGCGGAAGTAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F V I N E R A A E I D T P T I G I E E V F I A S
F V I . E R A A E I D T P T I G - - - - - - - -
TTCGTGATC---GAAAGAGCGGCTGAGATTGACACACCAACCATAGGC------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G H A T S F T D V A I E C E N C G R V Y R A D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y V K E K L G I E V D E T V E A V K E V M E V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D L K C E C G G R F K D P A P M N L M F S T T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G P G K G K K G Y L R P E T A Q G M F V D F K R
- - - - - - - - Y L R P E T A Q G M F - - - - -
------------------------TACCTTCGCCCCGAAACCGCTCAGGGAATGTTT---------------
169170171172173174175176177178179180181182183184185186187188189190191192
L A N F F R E K L P F G V A Q I G R A Y R N E I
- - - - - - - - - - F G V A Q I G R A Y R N - -
------------------------------TTCGGTGTGGCGCAGATTGGAAGGGCTTACAGGAAC------
193194195196197198199200201202203204205206207208209210211212213214215216
S P R Q G V I R L R E F N Q A E L E F F V H P G
- - - - - - - - - R E F N Q A E L E F F - - - -
---------------------------AGAGAGTTCAATCAGGCGGAGCTGGAGTTCTTC------------
217218219220221222223224225226227228229230231232233234235236237238239240
E K K H P H F S L Y A K D V V K L V D K F D S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H E I T L E E A V E K G I I A N Q I L A Y F I G
- - - - - - - - - - - - - - - - - - L A Y F I G
------------------------------------------------------CTGGCGTACTTCATAGGA
265266267268269270271272273274275276277278279280281282283284285286287288
K T R R F L L E I G I K D E K L R F R Q H K D D
K T R R F L L - - - - - - - - - - - - - - - - -
AAGACGAGGCGATTTCTGCTT---------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E R A H Y A T D C W D A E V L T S Y G W I E V V
- - - - - - - - C W D A E V - - - - - - - E V V
------------------------TGCTGGGATGCAGAAGTT---------------------GAGGTTGTT
313314315316317318319320321322323324325326327328329330331332333334335336
G I A D R T N Y D L K R H S K F S G E D L S V F
G I A D R - - - - - - - - - - - - - - - - - - -
GGCATTGCGGACAGA---------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V P Y E E P V K V K R R K I V P I L S K L G P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F R Q K A K K V A E A L E A L N V E A D L D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E V E V D G E K V K V T K E F F E I Q E V E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V T G E K V I P H V I E P S F G L D R I T Y S V
- - - - - - I . H V I E P S F G L D R I T Y S -
------------------ATA---CACGTCATAGAGCCATCCTTCGGCCTTGACAGGATTACCTACTCC---
433434435436437438439440441442443444445446447448449450451452453454455456
L E H A F D K D V V D G E E R R V L R L K R W V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S P I E V A V L P L L S R E P F E S K G M E I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q M L R E E G I F T D Y D D S G S I G R R Y R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F D E I G T P F C V T V D H Q T F E D E T V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R D R D T T A Q V R V K L G E L P S I L K E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568
R S E K D I T E F G E V F R Q V
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_gly_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D K Y E K V F E L A K R R G F L W N S F E L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G G S R G F Y D Y G P L G S T L K R R I E Q V W
- - - - - - - - - - - - - - - L K R R I E Q V W
---------------------------------------------CCTTATTGTGACAGTCCCATCCTGAAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R E F Y V I Q E G H M E I E C P T I G I E E V F
R E F Y V I . E G H M E I E C P T I G - - - - -
AGTGTCATAGTCCACGGT---CGAGTAAGGAGTCCCGATTTCATCGTTTCTCCTGTA---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I A S G H V G G F S D P L C E C M N C K E A F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A D H L V E N V T E A A G T L S A E E L T K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R E K E I R C P E C G G E F E D A Y E F N L M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K T T I G P G T G R Q G Y L R P E T A Q G M F V
- - - - - - - - - - - - Y L R P E T A Q G M F -
------------------------------------GGCCGCTTTCTGGGCAACGTTTTCTTCGTCAAA---
169170171172173174175176177178179180181182183184185186187188189190191192
D F Q R L S R F Y R D K L P F G A V Q I G K S Y
- - - - - - - - - - - - - - F G A V Q I G K S Y
------------------------------------------AGGTTCAATCACGTGAGGAATGACGTTTTC
193194195196197198199200201202203204205206207208209210211212213214215216
R N E I A P R Q G V I R L R E F T Q A E C E L F
R N - - - - - - - - - - - R E F T Q A E C E L F
TCCGCT---------------------------------GTCCGGGCTGACAGTCAGTTCTTCTCCATCCAA
217218219220221222223224225226227228229230231232233234235236237238239240
V D P R N K K H P N F E R F A D K E L V L Y S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A A Q Q T G E P V R L T V R E A V E T G V I A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I L G Y N I A L T N E F L T K V G I D P E K L
- - L G Y N I A L T N E F L T - - - - - - - - -
------TTCCACATAAACATAAAGGTCGGTCTTGCTGACCCTTGC---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R F R Q H L T D E M A H Y A I D C W D A E I E T
- - - - - - - - - - - - - - - - C W D A E I - -
------------------------------------------------TTCGGCGTCCCAGCAGTC------
313314315316317318319320321322323324325326327328329330331332333334335336
D R F G W V E I V G I A D R T D Y D L K A H A R
- - - - - - E I V G I A D R - - - - - - - - - -
------------------CGTCAGGTGCTGCCTGAACCTGAG------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V S K T D L Y V Y V E Y D E P K I V T R F V V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P N M G K L G P L F K G K A K A V A D A L K Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S E E E L S K D Q I K V T L D G E E L T V S P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V V D F A E E N I K V S G E N V I P H V I E P S
- - - - - - - - - - - - - - - - - P H V I E P S
---------------------------------------------------GATCTGCACCGCCCCGAAAGG
433434435436437438439440441442443444445446447448449450451452453454455456
Y G I D R I F Y G I M E H A F D E E N V A Q K A
Y G I D R I F Y G - - - - - - - - - - - - - - -
CAGCTTATCCCTGTAGAAGCGGGACAG---------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A E S G L K G A G E A E G T E D A G K E S G G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K S E S E A E G E E A R L V M H F S S A V A P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q V A V L P L L T R K E L A D P A K E I I A K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R E K T L L V N Y D D S G T I G R R Y R R N D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I G T P Y S V T V D Y D T L Q D G T V T I R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D S M R Q V R A P I N G I E N V L Y E L I Y R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612
R D F E S A G K P F N F
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_gly_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E T P N T K D K Y E K V M D L A K R R G Y L W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S F E I Y G G I A G F V D Y A P L G A M L K N
- - - - - - - - - - - - - - - - - - - - - L K N
---------------------------------------------------------------TACCTCGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N I I D T W R K H Y I T N E E F Y E I D C P T I
N I I D T W R K H Y I T . E E F Y E I D C P T I
CATTCTCATATATCTTCTTCCTATTGCTCCGCTGTC---ATATTCTGCAAGAATTCCGTTTTTTCTTAAATT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T P H D V L K A S G H V D N F T D P M I E C K E
T - - - - - - - - - - - - - - - - - - - - - - -
GTT---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
C L E S Y R A D H I I E E N I D I D T E G K T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E L Q Q L M E T H K I T C P K C S G Q F G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K S Y N L M F L T S I G P S G N R I G Y M R P E
- - - - - - - - - - - - - - - - - - - Y M R P E
---------------------------------------------------------TAATATATATTCTTC
169170171172173174175176177178179180181182183184185186187188189190191192
T A Q G I F I Q F R R L S Q F F R N K L P F G V
T A Q G I F - - - - - - - - - - - - - - - F G V
TCCATTTTTAATGGTATT---------------------------------------------GCTTACTAA
193194195196197198199200201202203204205206207208209210211212213214215216
A Q I G K A Y R N E I S P R Q G V I R L R E F T
A Q I G K A Y R N - - - - - - - - - - - R E F T
TTTCATATCTTTTTTAAATACTTTGCC---------------------------------CTCAATTTCCTT
217218219220221222223224225226227228229230231232233234235236237238239240
Q A E A E F F V H P T I K E H K K F K E V E N D
Q A E A E F F - - - - - - - - - - - - - - - - -
TGGTTCGTCATATTCTACAAA---------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V I P L L P A S R Q M D E S L P K D E K V I N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S L K D A V E N N I I R H E T I A Y F V A I T K
- - - - - - - - - - - - - - - I A Y F V A I T K
---------------------------------------------TAATTTGGAGCTGTCAATACCTATATC
289290291292293294295296297298299300301302303304305306307308309310311312
R F L L D I G I D S S K L R F R Q H L P D E M A
R F L L - - - - - - - - - - - - - - - - - - - -
CAACAAAAACCT------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Y A I D C W D A E I Y T D R F G W I E C V G I
- - - - - C W D A E I - - - - - - - - E C V G I
---------------ATTTATTACTTTTTCATC------------------------CCTACTTGCAGGTAA
337338339340341342343344345346347348349350351352353354355356357358359360
A D R T D F D L K A H M E N S G V D L S I F V E
A D R - - - - - - - - - - - - - - - - - - - - -
TAGGGGTAT---------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y D E P K E I E T Y E I E L N Y K V V G K V F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K D M K L V S D A L N E L D N N E M E K L V N T
- - - - - - S . . . . . . . . . . . . . . . . .
------------------AAA---------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I K N G E E Y I L K V G D K E F T I L E D Y L T
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A K K V Q K K V M G E K V L P H V I E P S H G I
. . . . . . . . . . . . . . . H V I E P S H G I
---------------------------------------------TGTGATTTTGTGAGTCTCCATTAATTG
457458459460461462463464465466467468469470471472473474475476477478479480
D R I T F C L L E H S F N E E E D R T Y L S I N
D R I T F C - - - - - - - - - - - - - - - - - -
TTGTAATTCCTCTAAGGT------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P T V S P I K V G V F P L V N K Q G M P E I A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D I K N N L R K N G I L A E Y D D S G A I G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y M R M D E V G A P F C I T V D G Q T L E D N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I T I R E R D S R E Q I R I K I E E V V D Y I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579
N K L
- - -
---------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_gly_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D V F D N V M D L A K R R G F V W P T T E C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y G S V A G F I D Y G P L G T L V K R R I E D L
- - - - - - - - - - - - - - - - V K R R I E D L
------------------------------------------------GTCAAACGTCGTATCGAAGACCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W R Q F Y V I S E G Y Y E I E C P T I G Q E A M
W R Q F Y V I . E G Y Y E I E C P T I G - - - -
TGGCGCCAGTTCTATGTAATA---GAAGGGTATTATGAGATAGAATGCCCGACAATCGGC------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y I A S G H V K G F S D K M C Q C P A C N E Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A D H V A E A H N I P N A A T L S C E A L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K I C T L P C P A C N E V L G K V E V F T F N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M F Q T T I G P G S Q R K G Y L R P E T A Q G I
- - - - - - - - - - - - - - Y L R P E T A Q G I
------------------------------------------TACCTTCGGCCTGAAACCGCTCAGGGTATC
169170171172173174175176177178179180181182183184185186187188189190191192
F V D F G R L L R F Y R D K L P F G T V Q I G R
F - - - - - - - - - - - - - - - F G T V Q I G R
TTC---------------------------------------------TTCGGAACCGTGCAGATAGGACGG
193194195196197198199200201202203204205206207208209210211212213214215216
S Y R N E I S P R Q G M I R L R E F T Q A E A E
S Y R N - - - - - - - - - - - R E F T Q A E A E
TCATACCGGAAT---------------------------------CGTGAATTCACCCAGGCTGAGGCTGAG
217218219220221222223224225226227228229230231232233234235236237238239240
I F V H P E M K D H P N F A R Y A D Y A F P L L
I F - - - - - - - - - - - - - - - - - - - - - -
ATCTTT------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S S E Q Q L G G L E A K T Y T M K D A V A A G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I A N E Y V A Y Y L A L T H E L L V T I G V M P
- - - - - V A Y Y L A L T H E L L V - - - - - -
---------------GTTGCCTACTACCTTGCCCTGACCCACGAACTCCTGGTC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S R L R F R Q H L P D E R A H Y A E D C W D A E
- - - - - - - - - - - - - - - - - - - C W D A E
---------------------------------------------------------TGCTGGGATGCTGAG
313314315316317318319320321322323324325326327328329330331332333334335336
I F S E R F G W V E T V G I A D R T D Y D L K A
I - - - - - - - - E T V G I A D R - - - - - - -
ATA------------------------GAAACGGTTGGTATTGCAGACCGG---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H A E Q S G D S F T A Y I Q Y D E P R R E K R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V I N A N M G V L G P K Y R G K A K A I S D A L
- - - - - - - - - - - - - - - - - - - - S . . .
------------------------------------------------------------TCT---------
385386387388389390391392393394395396397398399400401402403404405406407408
Q E V T P G P D G A T V I I D G E E I F V P A D
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L Y E V K E E E V D V R G V D V R P H V I E P S
. . . . . . . . . . . . . . . . . . H V I E P S
------------------------------------------------------CACGTTATCGAGCCCAGT
433434435436437438439440441442443444445446447448449450451452453454455456
Y G I D R M I Y A V L E H S Y F E E E V E G E V
Y G I D R M I Y A - - - - - - - - - - - - - - -
TATGGGATTGACCGGATGATCTATGCC---------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R K V M R F P S R V A P V Q V A I F P L M A R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G L D V M A K E I A R T L Q M Q G I L A E Y D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
S G A I G R R Y R R Q D E I G T P F A V T V D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D S L E D Q T V T L R D R D S M Q Q V R I P K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572
Q L V D L I P A L I R G K S S F S S L I
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_gly_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K D I Y E K I M D L A K R R G Y L W S S F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y G G I A G F V D Y G P L G C L L K N N I I S
- - - - - - - - - - - - - - - - - L K N N I I S
---------------------------------------------------TTAAAAAATAACATCATATCA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K F R E Q Y I I K E G F Y E I E S P T V T P Y E
K F R E Q Y I I . E G F Y E I E S P T V T - - -
AAGTTTAGAGAGCAATATATTATT---GAAGGATTTTATGAGATTGAAAGCCCAACAGTAACA---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L K A S G H V D N F T D P I V E C K N C L E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F R A D H L I E E F V D V D T E G K T L K E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L I R K H N I R C P K C G G E L G E V K K F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L M F V T S I G P G G K R T G Y M R P E T A Q G
- - - - - - - - - - - - - - - Y M R P E T A Q G
---------------------------------------------TACATGAGACCTGAAACAGCACAGGGA
169170171172173174175176177178179180181182183184185186187188189190191192
I F I Q F R R L A Q F F R N K L P F G V V Q I G
I F - - - - - - - - - - - - - - - F G V V Q I G
ATATTT---------------------------------------------TTTGGTGTTGTTCAAATTGGT
193194195196197198199200201202203204205206207208209210211212213214215216
K S Y R N E I S P R Q G V I R L R E F T Q A E I
K S Y R N - - - - - - - - - - - R E F T Q A E I
AAAAGTTATAGAAAT---------------------------------AGAGAATTCACCCAGGCAGAGATT
217218219220221222223224225226227228229230231232233234235236237238239240
E Y F V H P E R K E H E K F D L V K D E V V P L
E Y F - - - - - - - - - - - - - - - - - - - - -
GAATATTTT---------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L P A E R Q M D E N L S D D E K V I K I S I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V E K G I I R H Q T I A Y F I A L T K R F L E
- - - - - - - - - - - I A Y F I A L T K R F L E
---------------------------------ATTGCCTACTTTATAGCTCTAACAAAGAGGTTTTTAGAA
289290291292293294295296297298299300301302303304305306307308309310311312
A I G I D K D K I R F R Q H L P N E M A H Y A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D C W D A E I Y T E R F G W I E C V G I A D R T
- C W D A E I - - - - - - - - E C V G I A D R -
---TGTTGGGATGCTGAAATA------------------------GAGTGTGTTGGGATTGCAGATAGA---
337338339340341342343344345346347348349350351352353354355356357358359360
D Y D L R S H S A H S G V E L S V F V E L D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R E I E T Y E I N L N Y K V V G K I F K K D T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A I E A Y I N N L S E K E K E E F V K N I E N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G K V I I N I D G K E F E I L K D Y V E I K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K K V I K G E K V I P H V I E P S Y G I D R I T
- - - - - - - - - - P H V I E P S Y G I D R I T
------------------------------CCTCACGTTATAGAGCCATCCTATGGAATTGATAGAATAACC
457458459460461462463464465466467468469470471472473474475476477478479480
Y C L L E H S Y R E E E D R V Y L D L K P S I A
Y C - - - - - - - - - - - - - - - - - - - - - -
TACTGT------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
P I K A Y V L P L V N K D D M P K I A K E I E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
M L R E N G I I A E Y D D S G A I G R R Y M R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D E I G V P F C I T V D G Q T L E D R T V T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E R N T R E Q V R V K I D E L V D Y L K E R L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577
E
-
---
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_gly_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D T H S S S L L A I V S H A K E Y G F I Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S E I Y E G L Q A V Y D Y G P Y G A A L K R N
- - - - - - - - - - - - - - - - - - - - L K R N
------------------------------------------------------------TACCGTATCGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V Q N L W W Q S M T Q L H S N I V G M D A A I L
V Q N L W W Q S M T . L H . N I V G M D A A I L
TTCTAAGGTTTGATGGTCTATGGTAATACA---GGGGGT---TATTAAATCTTGCCTAGCATATCGTTTACC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M H P R T W K A S G H V D S F E D L M V D N K D
M - - - - - - - - - - - - - - - - - - - - - - -
AAT---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S K K R Y R I D V L I E N H A A E L S A Q G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T R A Q E L L E K L Q A L L Q A E E L A G L H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L L Q E K I V C P I S R T A N W T E V H R F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L M F A T K V G A Q E E N A D T I Y L R P E T A
- - - - - - - - - - - - - - - - - Y L R P E T A
---------------------------------------------------TGATCGTGCATGAATGCCTTC
193194195196197198199200201202203204205206207208209210211212213214215216
Q G I F V N F L N V Q K T A R M K V P F G I A Q
Q G I F - - - - - - - - - - - - - - - F G I A Q
TATCTCTTTATA---------------------------------------------GTGAGCTAATTGAGC
217218219220221222223224225226227228229230231232233234235236237238239240
I G K A F R N E I V A R Q F I F R M R E F E Q M
I G K A F R N - - - - - - - - - - - R E F E Q M
ATGCGGCTTGATTCTTAGTTT---------------------------------CCAACGTGCTTGTTGCCA
241242243244245246247248249250251252253254255256257258259260261262263264
E M Q F F I Q P G S E E K W F N Y W Q Q A R W Q
E M Q F F - - - - - - - - - F N Y W Q Q A R W Q
ATAATTAAACCACTT---------------------------CTGCATTTCCATCTGCTCAAACTCACGCAT
265266267268269270271272273274275276277278279280281282283284285286287288
W H I A L G L T E E K L R I K P H A Q L A H Y A
W H I - - - - - - - - - - - - - - - - - - - - -
ACGGAATAT---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K A A V D I E Y Q F P F G Y K E I E G I H A R S
- - A V D I E Y - - - - - - - E I E G I H A R -
------CCGAGCTGTTTTTTGTAC---------------------GCCTTGTGCTGTTTCTGGCCTTAA---
313314315316317318319320321322323324325326327328329330331332333334335336
D F D L K N H E V A S R K K L Q Y F D P E L N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N Y L P H V I E T S L G S D R L I L M L L C E A
- - - P H V I E T S L G S D R L I L M - - - - -
---------AGTACGTGATATAGGACATACAATCTTTTCTTGTAGTAAGAGCGTGTG---------------
361362363364365366367368369370371372373374375376377378379380381382383384
F T E E T I T E E E S A K T R T Y L K L H P A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A P I K A A I F P L V K K D N L P Q K A Q E I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K S L K Y D F P L I Y E E N Q S I G K R Y A R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D L I G T P Y C I T I D H Q T L E D D T V T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E R D S M Q Q E R V H V N I L R D F L L E K V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496
F K S I L A K L P T I D S V L I
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_gly_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P T K L D M A K F A K F C K D M G F V F Q S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E I Y G G I N G F W D Y G P L G V E L K R N I K
- - - - - - - - - - - - - - - - - - L K R N I K
------------------------------------------------------AATGCAGAACGGGGTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A W W Q D M V R N P P P G P D G Q E I R M V G
E A W W Q D M V . N P . . . . . . . . . R M V G
GGCCTCGTCCTGGCGCCGGTACCG---CCCGAT---------------------------GAAGAACGGCTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L D C S I I M N P N V W V A S G H V G G F S D P
L D C S I I M - - - - - - - - - - - - - - - - -
GAGCTCGCGGTAGAGCTTCTT---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M V D C L K C K K R F R A D K V H F A C A V V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S A P H A I S V E A D N A T D A E P L L K E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A K L D K K K H P V G R A L K A A A Q L E Y H S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A T A L P A S W P R P C P A E D C D G T L T E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R A F N L M F E S H A G P I A S D E N K V Y L R
- - - - - - - - - - - - - - - - - - - - - Y L R
---------------------------------------------------------------CTGCGGCTC
217218219220221222223224225226227228229230231232233234235236237238239240
P E T A Q G I F A N Y K N V L D S S R L K L P F
P E T A Q G I F - - - - - - - - - - - - - - - F
GTCCGAGAACGGGAACATGTACTC---------------------------------------------CTG
241242243244245246247248249250251252253254255256257258259260261262263264
G I A Q V G K A F R N E I N P R N F T F R S R E
G I A Q V G K A F R N - - - - - - - - - - - R E
TTCGCGCGGCACGAGGTTCTCGCTCTTCAGCCC---------------------------------CCAGTA
265266267268269270271272273274275276277278279280281282283284285286287288
F E Q M E I E F F C H P N E S R K W Y E Y W R D
F E Q M E I E F F - - - - - - - - - Y E Y W R D
TTCGTACCACTTCCGCGACTCGTTCGG---------------------------CTCGAACTCGCGCGACCG
289290291292293294295296297298299300301302303304305306307308309310311312
L R R Q W Y S R L G L K S E N L V P R E Q G Q E
L R R Q W Y S - - - - - - - - - - - - - - - - -
GAACGTGAAGTTCCGCGGGTT---------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E L A H Y S V G T T D I E Y M F P F S D E P Q E
- - - - - - - - T T D I E Y - - - - - - - - - E
------------------------CTTGTAGTTGGCGAAGAT---------------------------GAC
337338339340341342343344345346347348349350351352353354355356357358359360
L E G V A H R G D F D L S A H S S R S G K D L K
L E G V A H R - - - - - - - - - - - - - - - - -
CTTGTTCTCGTCCGACGCGAT---------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Y F D E E G W N A L L Q A R L E A F K D D K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R E E E K K K L E K E E K A Q F Q F V P H V I E
- - - - - - - - - - - - - - - - - - - P H V I E
---------------------------------------------------------GGCGATCTTCTCTTT
409410411412413414415416417418419420421422423424425426427428429430431432
P S A G A D R F T L A V L C E A Y T E D T A P D
P S A G A D R F T L A - - - - - - - - - - - - -
GAGCAGCGGTTCGGCGTCCGTGGCATTGTCGGC---------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A K G N P E T R I V M K F H P R L A P I K A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F P L V N K D G M D E E A K K L Y R E L K P F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N V V Y D Q S G A I G R R Y R R Q D E A G T P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
C I T V D G D T M K D G T V T I R D R D T L K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547
E R I P K S E V R K V L E K A L S P V
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_gly_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A V T M E E I V A H A K H R G F V F P G S E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y G G L A N T W D Y G P L G V E L K N N I K R A
- - - - - - - - - - - - - - - - L K N N I K R A
------------------------------------------------CGTGATGCAAAACGGCGTGCCGAT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W W K K F V Q E S P Y N V G L D A A I L M N P R
W W K K F V . E S . Y N V G L D A A I L M - - -
TTCATCTTGGCGGCGGTA---CTTGCC---CGAGCCGGTTTCGTCATAGTCGACCATGAAATG---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T W E A S G H L G N F N D P M V D C K Q C K A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H R A D K L I E K A L E E K G I E M I V D G L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L A K M D E L I K E Y D I A C P E C G S R D F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N V R Q F N L M F K T Y Q G V T E S S A N E I Y
- - - - - - - - - - - - - - - - - - - - - - - Y
---------------------------------------------------------------------CGA
169170171172173174175176177178179180181182183184185186187188189190191192
L R P E T A Q G I F V N F K N V Q R T M R K K L
L R P E T A Q G I F - - - - - - - - - - - - - -
CGCAATGCCCCAGAGCTCGCCCCAGCCGAA------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P F G I A Q I G K S F R N E I T P G N F T F R T
- F G I A Q I G K S F R N - - - - - - - - - - -
---CAACTCTTCTTTCGCATGGTCGCGCAGGCGGATGTT---------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R E F E Q M E L E F F C K P G E E L Q W F D Y W
R E F E Q M E L E F F - - - - - - - - - F D Y W
CTTGCAAAACTGTTTCCAATAGTCAAACCATTG---------------------------CTCGAGCTCCAT
241242243244245246247248249250251252253254255256257258259260261262263264
K Q F C K D W L L S L G M K E D N I R L R D H A
K Q F C K D W L L - - - - - - - - - - - - - - -
CTGTTCGAATTCGCGCGTGCGGAACGT---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K E E L S H Y S N A T T D I E Y H F P F G W G E
- - - - - - - - - - T T D I E Y - - - - - - - E
------------------------------CGTGCGCTGGACGTTTTT---------------------CGC
289290291292293294295296297298299300301302303304305306307308309310311312
L W G I A S R T D Y D L K Q H M E H S G E D F H
L W G I A S R - - - - - - - - - - - - - - - - -
TGTCTCTGGACGCAAATAAAT---------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y L D Q E T N E R Y I P Y C I E P S L G A D R V
- - - - - - - - - - - P Y C I E P S L G A D R V
---------------------------------GCATTCCGGGCAGGCGATGTCGTACTCCTTGATGAGTTC
337338339340341342343344345346347348349350351352353354355356357358359360
T L A F M I D A Y D E E E L E D G T T R T V M H
T L A - - - - - - - - - - - - - - - - - - - - -
ATCCATTTT---------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L H P A L A P Y K A A V L P L S K K L A D G A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I Y E E L A K H F M V D Y D E T G S I G K R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R R Q D E I G T P F C I T Y D F E S E Q D G Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T V R D R D T M E Q V R L P I G E L K A F L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460
K I A F
- - - -
------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_gly_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A T S M D E L V S L C K R R G F I F P G S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y G G L Q G T Y D Y G P L G I E L K N N L K A
- - - - - - - - - - - - - - - - - L K N N L K A
---------------------------------------------------CTCAAAAACAATCTCAAAGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A W W R A M V Y E R D D V E G L D A S I L T H R
A W W R A M V . E R D . V E G L D A S I L T - -
GCGTGGTGGCGAGCTATGGTC---GAACGCGAC---GTGGAAGGCCTCGATGCCTCAATTTTGACC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V L R H S G H E A T F T D P M V D C R N C K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R W R A D Q L K D N K C E K C G S T D L T E P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P F N L M F K T A V G P I A E E G S F A Y L R P
- - - - - - - - - - - - - - - - - - - - Y L R P
------------------------------------------------------------TACTTGCGACCC
145146147148149150151152153154155156157158159160161162163164165166167168
E T A Q G I F T N F K N V V D A T S R R L P F G
E T A Q G I F - - - - - - - - - - - - - - - F G
GAAACCGCCCAAGGGATTTTT---------------------------------------------TTTGGC
169170171172173174175176177178179180181182183184185186187188189190191192
I A Q I G K A F R N E I T P R N F I F R V R E F
I A Q I G K A F R N - - - - - - - - - - - R E F
ATCGCCCAAATCGGTAAGGCCTTCCGCAAC---------------------------------CGTGAATTC
193194195196197198199200201202203204205206207208209210211212213214215216
E Q M E L E F F V Q P G T D D E W H S Q W V E A
E Q M E L E F F - - - - - - - - - H S Q W V E A
GAGCAAATGGAGCTTGAATTCTTC---------------------------CATAGCCAATGGGTTGAAGCT
217218219220221222223224225226227228229230231232233234235236237238239240
R L Q W W R D Q G L L S E N L Q A Y H Q A G D E
R L Q W W R - - - - - - - - - - - - - - - - - -
CGCTTGCAATGGTGGCGT------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L A H Y A K A T V D I L Y Q F P H G L E E L E G
- - - - - - - T V D I L Y - - - - - - - E L E G
---------------------ACCGTCGATATTCTCTAT---------------------GAACTAGAGGGG
265266267268269270271272273274275276277278279280281282283284285286287288
I A N R T D F D L G S H T R G Q A D L G L S A K
I A N R - - - - - - - - - - - - - - - - - - - -
ATTGCTAATCGA------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V D P N E D S T A K L T I P H P E T Q K P L V P
- - - - - - - - - - - - - - - - - - - - - - - P
---------------------------------------------------------------------CCA
313314315316317318319320321322323324325326327328329330331332333334335336
F V I E P S A G V D R G V L A I L T E A F T K E
F V I E P S A G V D R G V L A - - - - - - - - -
TTCGTGATCGAGCCATCGGCTGGGGTTGATCGGGGGGTATTGGCG---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T L E N G S E R I V L K L K P H L A P I K V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L P L A R N K P E I V E K A K A I K S L L M A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G I G R I F Y E D T G N I G K G Y R R H D E V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T P F C V T V D F D T L G R G D D A S L L D T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T V R D R D T M S Q V R I H I N E L A S Y I R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459
R L V
- - -
---------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_gly_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K N N K L V N L I N H L K T Q G F V Y Q G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E I Y G G L A N T W D Y G P L G S L L L N N I K
- - - - - - - - - - - - - - - - - - L L N N I K
------------------------------------------------------AAGAGCGAAAAATGTTCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N E W I K Y F I H N E E N N F L I D A K I L M N
N E W I K Y F I . N E . N N F L I D A K I L M -
AATTGCATCTTGTCTTCTGTATCT---TCCAAT---AGCAGATTCATCATAAGTAGTTCTGAAATTATG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E V W K T S G H V G N F S D P L I E N K I N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K R Y R A D H L I E E F D P L M K I E T L S E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E M E N F I K R N I T K Y E G V A T D W T S I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K F N L M F E T Y Q G I L E D S K N K I Y L R P
- - - - - - - - - - - - - - - - - - - - Y L R P
------------------------------------------------------------AAAATCTCCACG
169170171172173174175176177178179180181182183184185186187188189190191192
E T A Q A I F V N F K N I L R T T R T K I P F G
E T A Q A I F - - - - - - - - - - - - - - - F G
ATTTGCCACTCCCAAAAGTTC---------------------------------------------AGAATA
193194195196197198199200201202203204205206207208209210211212213214215216
V G Q I G K S F R N E V T P G N F I F R T R E F
V G Q I G K S F R N - - - - - - - - - - - R E F
ATGAGATAATTCTTCCTTAGCATGTTTTCT---------------------------------TATCAAAAA
217218219220221222223224225226227228229230231232233234235236237238239240
E Q M E L E Y F V H P N D S D K A F E Y Y L K K
E Q M E L E Y F - - - - - - - - - F E Y Y L K K
TTCATAACATTTTTTTAAATAATA---------------------------ATGAACAAAATATTCTAATTC
241242243244245246247248249250251252253254255256257258259260261262263264
C Y E F L I F L G I K K D L L K I R K H A K E E
C Y E F L I - - - - - - - - - - - - - - - - - -
CATTTGTTCAAATTCTCT------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S H Y S S A T S D I E F K F D F G W G E L L G
- - - - - - - T S D I E F - - - - - - - E L L G
---------------------TTTAGTTCTTGTAGTTCT---------------------AAAAATAGCTTG
289290291292293294295296297298299300301302303304305306307308309310311312
V A N R G D F D L S S H S K A T N E E L S Y F D
V A N R - - - - - - - - - - - - - - - - - - - -
TGCAGTTTCAGG------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S I E N I T Y I P H V I E P S M G L D R L A L A
- - - - - - - - P H V I E P S M G L D R L A L A
------------------------ATCAGTTGCAACTCCTTCGTATTTAGTAATATTTCTTTTAATAAAATT
337338339340341342343344345346347348349350351352353354355356357358359360
I L T S S Y E E E T L E V D S R V V L K L N K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L V P Y Q I A V L P L V K K F S E E S K E L V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
W L K Q H N F R T T Y D E S A S I G K R Y R R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D A I G T F F A L T Y D Y Q S A E N Q S F T I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N R D T M E Q I R I N K I D L I S Y L T K E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458
G I
- -
------
Class II
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_gly_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T A P A Q R P T P P A D A A R S M E A L V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
C K R R G F V F P A S E I Y G G I N G F W D Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L G T A L K N H V R D H W W H Q T V E C P P L
- - - - - L K N H V R D H W W H Q T V . C P . .
---------------ACGCTTGCCGATGGTCTGCTTGGCGTCGTACTCGCAGGCGAA---CTGGCG------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D P D S G E P L S V L G L D S A I I Q N P K V W
. . . . . . . . S V L G L D S A I I Q - - - - -
------------------------GGGCATCCCGTCCTTGTTCACGAGCGGGAAGAC---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E A S G H V G G F S D P M V D C R E T N G R Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q D Q V E V L F V E G R G A W A F P E N K P D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I A K K L R K A G V T I D D G E V K N L S Q V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E S L Y G T I V A P D T D K A G T L T P P R E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N L M L D T Y P G V I R N E E N K A Y L R P E T
- - - - - - - - - - - - - - - - - - Y L R P E T
------------------------------------------------------GTGGGCCAGCTCGTCGGA
217218219220221222223224225226227228229230231232233234235236237238239240
A Q G I F L N Y L N V L N T M R V K V P F G I A
A Q G I F - - - - - - - - - - - - - - - F G I A
CCCGTGGTCCCGGAA---------------------------------------------CCGCTCGTGCTT
241242243244245246247248249250251252253254255256257258259260261262263264
Q I G K S F R N E V T P R N F I F R S R E F E Q
Q I G K S F R N - - - - - - - - - - - R E F E Q
CCAGAAGTCGTACCACTTGGGCGC---------------------------------CTGCTCGAACTCGCG
265266267268269270271272273274275276277278279280281282283284285286287288
M E M E W F C S E E E A P K W Y D F W K H E R M
M E M E W F - - - - - - - - - Y D F W K H E R M
GGAGCGGAAGATGAAGTT---------------------------CTTGCCGATCTGCGCGATCCCGAAGGG
289290291292293294295296297298299300301302303304305306307308309310311312
R W W E S L G I D Q A N L R F R D H G S D E L A
R W W E - - - - - - - - - - - - - - - - - - - -
CACCTTCACCCG------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Y S S A C V D V E Y R Y P F T A P G F G E L E
- - - - - C V D V E Y - - - - - - - - - - E L E
---------------CTCGTTGCGGATGACACC------------------------------ACGCGGCGG
337338339340341342343344345346347348349350351352353354355356357358359360
G V A H R G N F D L T A H T R A S N A K L D Y F
G V A H R - - - - - - - - - - - - - - - - - - -
GGTGAGCGTGCCGGC---------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D Q E L Q L R L K A E G V G K D E I K E R S R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T P H V I E P A S G L T R A V L V L L C E A F T
- P H V I E P A S G L T R A V L V - - - - - - -
---GGGGAAGGCCCAGGCTCCTCTGCCCTCGACGAAGAGCACCTCGACCTG---------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P S P E R S G S D Y V M K F K P K F A P V K A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V F P L V N K D G M P E V A H K L Y M E L R Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F A C E Y D A K Q T I G K R Y A R M D E I G T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F C I A V D G D T L E N N V V T I R D R D T T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522
Q E R V G I D R V A A F L A E K G C
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_gly_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K D M D T I V S L A K H R G F V F P G S D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y G G L S N T W D Y G P L G V E L K N N V K K A
- - - - - - - - - - - - - - - - L K N N V K K A
------------------------------------------------TTAAAGAATAATGTTAAAAAAGCT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W W Q K F I T Q S P F N V G I D A A I L M N P K
W W Q K F I . Q S . F N V G I D A A I L M - - -
TGGTGGCAAAAATTCATT---CAATCA---TTTAACGTTGGTATCGATGCTGCAATCTTAATG---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V W E A S G H L N N F N D P M I D N K D S K I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y R A D K L I E D Y M Q D V K G D E N F I A D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L S F E Q M K K I I D D E G I V C P V S K T A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W T E I R Q F N L M F K T F Q G V T E D S T N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I F L R P E T A Q G I F V N Y K N V Q R S M R K
- F L R P E T A Q G I F - - - - - - - - - - - -
---TTCTTACGTCCTGAAACAGCACAAGGTATTTTT------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K L P F G I G Q I G K S F R N E I T P G N F I F
- - - F G I G Q I G K S F R N - - - - - - - - -
---------TTTGGTATCGGTCAAATTGGTAAATCATTCCGTAAT---------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R T R E F E Q M E L E F F C K P G E E I E W Q N
- - R E F E Q M E L E F F - - - - - - - - - Q N
------AGAGAATTTGAACAAATGGAACTTGAATTCTTC---------------------------CAAAAT
241242243244245246247248249250251252253254255256257258259260261262263264
Y W K T F A S D W L T S L N M S S E N M R L R D
Y W K T F A S D W L T - - - - - - - - - - - - -
TATTGGAAAACTTTTGCAAGTGACTGGTTAACA---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H D E D E L S H Y S N A T T D I E Y K F P F G W
- - - - - - - - - - - - T T D I E Y - - - - - -
------------------------------------ACAACTGATATTGAATAT------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G E L W G I A S R T D F D L R K H A E H S G E D
- E L W G I A S R - - - - - - - - - - - - - - -
---GAGTTATGGGGTATCGCAAGTCGT---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
F R Y H D P E T N E K Y I P Y C I E P S L G A D
- - - - - - - - - - - - - P Y C I E P S L G A D
---------------------------------------CCATATTGTATCGAGCCATCACTTGGTGCAGAT
337338339340341342343344345346347348349350351352353354355356357358359360
R V T L A F L C D A Y D E E G V E G S K D A R T
R V T L A - - - - - - - - - - - - - - - - - - -
CGTGTAACATTAGCT---------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V L H F H P A L A P Y K A A I L P L S K K L S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E A I K I F E Q L S S K F S I D F D E S Q S I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K R Y R R Q D E I G T P Y C V T F D F D S L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N Q V T V R D R D S M E Q V R M P I S E L E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463
L T E K T K F
- - - - - - -
---------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_gly_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A Q E D V F K K L V S H C K E Y G F V F P S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D I Y D G L G A V Y D Y G Q M G V E L K N N I K
- - - - - - - - - - - - - - - - - - L K N N I K
------------------------------------------------------CTGAAAAACAATATTAAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K Y W W D S M V L L H E N I V G I D S A I F M H
K Y W W D S M V L . H . N I V G I D S A I F M -
AAATACTGGTGGGACAGCATGGTGTTG---CAC---AACATTGTCGGTATTGACTCTGCAATCTTTATG---
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P T I W K A S G H V D A F N D P L I D N K D S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K R Y R A D V L I E D Q L A K Y D D K I N K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A K A A K R F G E A F D E A Q F R S T N G R V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E H Q A K R D A L H E R F A K A L N D N N L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L R Q I I V D E E I A C P I S G T K N W T E V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q F N L M F S T D M G S T A D G S M K I Y L R P
- - - - - - - - - - - - - - - - - - - - Y L R P
------------------------------------------------------------TATCTTCGTCCG
217218219220221222223224225226227228229230231232233234235236237238239240
E T A Q G I F V N Y L N V Q K T G R M K V P F G
E T A Q G I F - - - - - - - - - - - - - - - F G
GAGACGGCACAGGGTATCTTT---------------------------------------------TTCGGT
241242243244245246247248249250251252253254255256257258259260261262263264
I A Q I G K A F R N E I V A R Q F I F R M R E F
I A Q I G K A F R N - - - - - - - - - - - R E F
ATCGCTCAGATCGGTAAAGCTTTCCGTAAC---------------------------------CGTGAGTTC
265266267268269270271272273274275276277278279280281282283284285286287288
E Q M E M Q F F V R P G S E L E Y F K K W K E I
E Q M E M Q F F - - - - - - - - - F K K W K E I
GAACAGATGGAGATGCAGTTCTTT---------------------------TTCAAGAAATGGAAAGAAATT
289290291292293294295296297298299300301302303304305306307308309310311312
R L K W H K A L G F G D D H Y R F H D H D K L A
R L K W H K - - - - - - - - - - - - - - - - - -
CGTTTGAAGTGGCACAAG------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Y A N A A T D I E F L M P F G F K E V E G I H
- - - - - A T D I E F - - - - - - - E V E G I H
---------------GCTACTGACATTGAGTTC---------------------GAAGTAGAAGGTATTCAC
337338339340341342343344345346347348349350351352353354355356357358359360
S R T N F D L S Q H E K F S G K S I K Y F D P E
S R - - - - - - - - - - - - - - - - - - - - - -
TCCCGT------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N E S Y T P Y V I E T S I G V D R M F L S I M
- - - - - - P Y V I E T S I G V D R M F L S - -
------------------CCGTACGTAATCGAAACGTCGATCGGTGTTGATCGTATGTTCCTCAGT------
385386387388389390391392393394395396397398399400401402403404405406407408
S A A Y C E E Q L E N G E S R V V L K L P A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A P V K L A V M P L V K K D G L P E K A R E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D N L K F H F H C Q Y D E K D S I G K R Y R R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D A I G T P Y C V T V D H Q T L E D N C V T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
N R D T M E Q E R V A I S E L N N I I A D R V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513
I T S L L K T I Q
- - - - - - - - -
---------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_gly_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A T S L D Q I V A L A K R R G F I F P S S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y G G L Q G V Y D Y G P L G V E L K N N I I A
- - - - - - - - - - - - - - - - - L K N N I I A
---------------------------------------------------TTGAAGAATAACATCATTGCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D W W R T N V Y E R D D M E G L D A A I L M N R
D W W R T N V . E R D . M E G L D A A I L M - -
GATTGGTGGCGGACGAATGTG---GAACGTGAC---ATGGAGGGTCTCGATGCGGCAATCTTGATG------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V W K Y S G H E E T F N D P L V D C R T C K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R W R A D H I H G V C P N C G S R D L T E P R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F N M M F R T Q I G P V A D S S S F A Y L R P E
- - - - - - - - - - - - - - - - - - - Y L R P E
---------------------------------------------------------TACTTGCGCCCCGAA
145146147148149150151152153154155156157158159160161162163164165166167168
T A Q G I F V N F A N V L A T T A R K L P F G I
T A Q G I F - - - - - - - - - - - - - - - F G I
ACGGCACAAGGCATTTTC---------------------------------------------TTTGGGATT
169170171172173174175176177178179180181182183184185186187188189190191192
A Q V G K A F R N E I T P R N F I F R V R E F E
A Q V G K A F R N - - - - - - - - - - - R E F E
GCCCAAGTCGGCAAGGCGTTTCGCAAC---------------------------------CGTGAATTCGAG
193194195196197198199200201202203204205206207208209210211212213214215216
Q M E I E Y F V M P G T D E E W H Q R W L E A R
Q M E I E Y F - - - - - - - - - H Q R W L E A R
CAGATGGAGATTGAGTATTTT---------------------------CATCAGCGGTGGCTTGAGGCCCGA
217218219220221222223224225226227228229230231232233234235236237238239240
L A W W E Q I G I P R S R I T I Y D V P P D E L
L A W W E - - - - - - - - - - - - - - - - - - -
TTGGCGTGGTGGGAG---------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A H Y S K R T F D L M Y D Y P N I G V Q E I E G
- - - - - - T F D L M Y - - - - - - - - E I E G
------------------ACGTTCGACCTTATGTAC------------------------GAGATCGAGGGC
265266267268269270271272273274275276277278279280281282283284285286287288
I A N R T D Y D L G S H S K D Q D Q L N L T A R
I A N R - - - - - - - - - - - - - - - - - - - -
ATCGCTAACCGT------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V N R N E D S L A R L T Y F D Q A S G R H V V P
- - - - - - - - - - - - - - - - - - - - - - - P
---------------------------------------------------------------------CCG
313314315316317318319320321322323324325326327328329330331332333334335336
Y V I E P S A G V G R C M L A V M C E G Y A E E
Y V I E P S A G V G R C M L A - - - - - - - - -
TATGTGATCGAGCCATCAGCCGGGGTAGGACGTTGTATGCTGGCG---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L T K P I P T E K L T A V G D A L Q T F L K S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G R S E K I G G E A R D A I L A R G E A L Q Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L T E R L P E V E Q L L A M P G A D Q I E V G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K L R G Q V Q P L I D E H Y R T V L R L K P R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A P I K A A V F P L K R N H E Q L V T T A K A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R R Q L Q V G G E M R T V Y D D T G A I G K L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R R Q D E I G T P F C I T V D F D T I G Q G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P S L A G T V T V R D R D T M A Q E R V P I S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539
L E G Y L R E K L R A
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_gly_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T V R P F D C L T L R R S H M P A T S M E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V S L C K R R G F I F Q G S E I Y G G L Q G F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D Y G P L G V E L K N N I K A A W W R S N V Y E
- - - - - - - - L K N N I K A A W W R S N V . E
------------------------CTGAAGAACAACATCAAGGCGGCGTGGTGGCGCTCCAACGTC---GAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R D D M E G L D A S I I M H R M V L R H S G H E
R D . M E G L D A S I I M - - - - - - - - - - -
CGCGAC---ATGGAAGGGCTGGACGCCTCCATCATCATG---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A T F S D P M I D N K K N N K R Y R L D H L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D Q K A D V Q A K V A E I M G E S A D N F A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V A A L N A K P A Q A S A A F K E A G V R D P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S G E V G E W T D P K P F N M M F R T T I G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A D E E S Y G Y L R P E T A Q G I F T N F K N V
- - - - - - - Y L R P E T A Q G I F - - - - - -
---------------------TACCTGCGTCCCGAAACCGCGCAGGGCATCTTC------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V D S T S R R L P F G I A Q I G K A F R N E I T
- - - - - - - - - F G I A Q I G K A F R N - - -
---------------------------TTCGGCATCGCGCAGATCGGCAAGGCGTTCCGCAAC---------
241242243244245246247248249250251252253254255256257258259260261262263264
P R N F I F R V R E L E Q M E I E F F V T P G T
- - - - - - - - R E L E Q M E I E F F - - - - -
------------------------CGTGAGCTAGAGCAGATGGAAATTGAGTTCTTC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
D E E W H E H W L E K R L K W W E D Q G V P R E
- - - - H E H W L E K R L K W W E - - - - - - -
------------CACGAGCACTGGCTGGAAAAGCGCCTGAAATGGTGGGAA---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K I E I L D V P K E D L A H Y S K R T Y D L M Y
- - - - - - - - - - - - - - - - - - T Y D L M Y
------------------------------------------------------ACCTACGACCTGATGTAC
313314315316317318319320321322323324325326327328329330331332333334335336
D Y P T L G H E E I E G I A N R S D Y D L G S H
- - - - - - - - E I E G I A N R - - - - - - - -
------------------------GAAATCGAGGGCATCGCCAACCGC------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T K S Q S E L G L V A K V E E N N D S I A K L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I P H P E T N K P V V P F V I E P S A G V D R A
- - - - - - - - - - - P F V I E P S A G V D R A
---------------------------------CCGTTCGTGATCGAGCCGTCGGCGGGGGTAGACCGGGCG
385386387388389390391392393394395396397398399400401402403404405406407408
M L A V L S E A F T K E T L E N G N E R I V L K
M L A - - - - - - - - - - - - - - - - - - - - -
ATGCTGGCG---------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L K P H L A P I K V A V I P L A R N R E E I T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V A K A I K A E L Q G L G L G R V L Y E D S G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I G K A Y R R H D E V G T P Y C V T V D F D T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G L G E N T D E S L K D T V T V R D R D T L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521
E R V K I S E L A G W I Q A K L R
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_gly_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V R M E D I I S L A K R K G F V F Q S S E V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G G L S G A W D Y G P L G V E L K K N I K K E W
- - - - - - - - - - - - - - - L K K N I K K E W
---------------------------------------------ATCCTCAATCGTATTGTAATCTATTGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W K S M V Y L H E N I V G L D S A I F M R P E I
W K S M V . L H . N I V G L D S A I F M - - - -
TACGCAATAAGGAGT---TATTTC---TTGACGTCTATACCTTTTACCTATTGTTCCACT------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W R A S G H V D G F S D S M V D C K D C K S R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A D F I D L S K N C P N C K V G N N F T S P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S F N L M F K T H I G V V E D S S S E V Y L R P
- - - - - - - - - - - - - - - - - - - - Y L R P
------------------------------------------------------------AGAAGTCTCAAT
145146147148149150151152153154155156157158159160161162163164165166167168
E T A Q G I F V N F R N V L D S S R L K I P F G
E T A Q G I F - - - - - - - - - - - - - - - F G
AACATAAGGCACATATTTCTC---------------------------------------------AAATTT
169170171172173174175176177178179180181182183184185186187188189190191192
I A Q V G K A F R N E I V T K N F I F R T C E F
I A Q V G K A F R N - - - - - - - - - - - C E F
AGCGTGCTGAGTTAAATCATAATTACCTCT---------------------------------CGGAAATTC
193194195196197198199200201202203204205206207208209210211212213214215216
E Q M E M Q F F V H P K Q I D E W F C Y W Q Q N
E Q M E M Q F F - - - - - - - - - F C Y W Q Q N
ATACTCAATATCAAATGCAGCTTT---------------------------ATGCGCCTTAAATCTTAATCT
217218219220221222223224225226227228229230231232233234235236237238239240
R M N F F I E T L K I S P D R L R F K A H D S T
R M N F F I - - - - - - - - - - - - - - - - - -
ATCGGGACTAATTTTAAG------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q L A H Y A K A A F D I E Y E F P F G F Q E V E
- - - - - - - - A F D I E Y - - - - - - - E V E
------------------------CTGCATTTCCATTTGCTC---------------------AAAATTTTT
265266267268269270271272273274275276277278279280281282283284285286287288
G I H N R G N Y D L T Q H A K F S N K P K V F E
G I H N R - - - - - - - - - - - - - - - - - - -
AGTAACTATCTCATT---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y H D L L T K E K Y V P Y V I E T S A G L T R S
- - - - - - - - - - - P Y V I E T S A G L T R S
---------------------------------TGCTGTCTCAGGCCTTAAATAAACTTCACTAGAACTATC
313314315316317318319320321322323324325326327328329330331332333334335336
V L M T L C D A Y S E E E L S D G D K R I V L R
V L M - - - - - - - - - - - - - - - - - - - - -
CTCCACTAC---------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L H P K L A P Y K I A I F P L V K K V E L T E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R I Y M E L C D D F H I F Y D D S G T I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R Y R R Q D E I G T P Y C V T I D Y N T I E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T V T V R E R N S M T Q K R I F I N D L Y S Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445
K T E I L N Y K E D F N K
- - - - - - - - - - - - -
---------------------------------------
Class II
Eukaryotes/Dictyostelium discoideum/amino acid sequences/Ddiscoideum_gly_aa
Eukaryotes/Dictyostelium discoideum/nucleotide sequences/Ddiscoideum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I L L K S L I N K S S L S S P S F K S I N K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L T F K N I N N Y Y T T T T T T T S L N L K S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I L F N N S D N K M S I D N K E K I R A G L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L M K R R F F I T Q S F S I Y G G Q A G L Y D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G P P G C A V K A N L I N L W R Q H F V L N E D
- - - - - - V K A N L I N L W R Q H F . L N E D
------------------GTCAAAGCAAACCTTATCAACCTTTGGAGACAACATTTC---TTAAATGAAGAT
121122123124125126127128129130131132133134135136137138139140141142143144
M S E V D C V S V T P E Q V L K A S G H V A K F
M S E V D C V S V T - - - - - - - - - - - - - -
ATGTCCGAAGTTGATTGTGTTTCTGTAACA------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A D F M V K D E V T K A F F R A D H I L E A H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q T L L K D T S K M S K E Q I E E L N F V L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A G D Y N Q E Q L K E S L I K Y N V K A P E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N A L T E P Y P F N L M F Q T Q I G P S G L S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G Y L R P E T A Q G I F T N F G K L Y E Y N G K
- Y L R P E T A Q G I F - - - - - - - - - - - -
---TACCTTCGTCCAGAGACAGCACAAGGTATTTTC------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K L P F A A A Q I G N A F R N E I A P R A G L L
- - - F A A A Q I G N A F R N - - - - - - - - -
---------TTTGCCGCCGCACAAATTGGTAATGCCTTTAGAAAT---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R V R E F T M A E I E H F V N P N N K T H P K F
- - R E F T M A E I E H F - - - - - - - - - - -
------AGAGAGTTTACAATGGCCGAGATTGAGCATTTC---------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N E I K D V E A N L L S S D S Q D K T S E I Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C T F G E A V E K K L I D N E T L A Y F M A R T
- - - - - - - - - - - - - - - - L A Y F M A R T
------------------------------------------------CTCGCTTACTTTATGGCTCGTACT
361362363364365366367368369370371372373374375376377378379380381382383384
Q Q F L H T V G I K P A G L R F R Q H Q K N E M
Q Q F L H - - - - - - - - - - - - - - - - - - -
CAACAATTCCTTCAC---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A H Y A Q D C W D A E I L S S Y G W V E C V G H
- - - - - - C W D A E I - - - - - - - E C V G H
------------------TGTTGGGATGCTGAAATC---------------------GAATGTGTAGGTCAT
409410411412413414415416417418419420421422423424425426427428429430431432
A D R S C Y D L K V H A T E S K S N L S A Y E E
A D R - - - - - - - - - - - - - - - - - - - - -
GCCGATCGT---------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
F K E P Q F V D I A K V V V N P G A I S K K H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A A V S P I K K Y L T E L K D D L A K A L E I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E T I T K D G S Y N L V L D G N T Y D I T A D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V T I S K A Q E K K N G H T F F P H V I E P S F
- - - S . . . . . . . . . . . . . H V I E P S F
---------AGT---------------------------------------CATGTCATTGAACCATCATTT
529530531532533534535536537538539540541542543544545546547548549550551552
G L G R I I Y S I L E Q N Y Y T R E N D E Q R G
G L G R I I Y S - - - - - - - - - - - - - - - -
GGTTTGGGTCGTATCATTTACTCA------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V L S L P A I I A P V K A S I L P L T S S D R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A P F V Q T I S K A L K E A N I S T K V D D T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N A I G R K Y A R T D E I G V P F G V T I D F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T V E D N T V T L R E R D T T K Q V R I P I S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L A S T L R K L C D L T V S W S D I L K T F P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678
Y E G Q S E
- - - - - -
------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_gly_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E S S F A N V L V R R F F V V P A F E I Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G V A G L Y D L G P S T T E L R N N F L S M W R
- - - - - - - - - - - - - - L R N N F L S M W R
------------------------------------------TTGCGCAACAATTTCCTGAGCATGTGGCGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q H F V V A E D M L E I M C T N I V P D K V L Q
Q H F V . A E D M L E I M C T N I V - - - - - -
CAACACTTTGTC---GCTGAAGATATGCTCGAGATAATGTGCACCAATATTGTT------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A S G H V A R F A D V M V K D T K N G E C F R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D K L I E S Y L E K K L A A E G K S L D E D Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K A L N S L L N S V D G A S P E V I K E L I Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M H V L S P S G N P L S D P F P F N L M F Q T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I G P S A G S T V Y L R P E T A Q G I F M N F K
- - - - - - - - - Y L R P E T A Q G I F - - - -
---------------------------TATCTAAGGCCTGAGACTGCACAAGGCATATTC------------
193194195196197198199200201202203204205206207208209210211212213214215216
R G L E Q A K Q L P F A M A Q V G T V F R N E I
- - - - - - - - - - F A M A Q V G T V F R N - -
------------------------------TTTGCCATGGCGCAGGTTGGAACAGTTTTTCGCAAT------
217218219220221222223224225226227228229230231232233234235236237238239240
S P R N S L L R V R E F E Q C E I E H F I D G T
- - - - - - - - - R E F E Q C E I E H F - - - -
---------------------------CGTGAATTCGAACAGTGTGAGATTGAGCATTTC------------
241242243244245246247248249250251252253254255256257258259260261262263264
P D S F R H P K I S T V A W C Y V E L F T A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q L A G L P C G K K M S I Q N A L D N K V L A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E T M A Y F I G R T Y L F L L K L G L D P A R L
- - M A Y F I G R T Y L F L L - - - - - - - - -
------ATGGCATACTTTATCGGTCGCACATACCTCTTTCTACTG---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R F R Q H L P K Q L A H Y A R D C W D C D C L L
- - - - - - - - - - - - - - - - C W D C D C - -
------------------------------------------------TGCTGGGACTGTGACTGC------
337338339340341342343344345346347348349350351352353354355356357358359360
S C G W T E I V G I A D R S A Y D L Q V H S K A
- - - - - E I V G I A D R - - - - - - - - - - -
---------------GAGATTGTCGGAATCGCAGACCGT---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S G V D L T C F L K Y P E P R E V S Y N I C T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K M K E C A K V F K Q D V N L I R S T I E A I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G E D L E V L K A E L Q S T G S Y T L R I P G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D G E A E K D F E I L P N Y V Q F N C D T K M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
H G E S I V P H V I E P S F G V G R I L Y S I L
- - - - - - P H V I E P S F G V G R I L Y S - -
------------------CCCCACGTTATCGAGCCTTCCTTCGGGGTTGGCAGGATCCTTTATTCG------
481482483484485486487488489490491492493494495496497498499500501502503504
E H S F Y T R N I D E Q R T V F R F K P Y L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
C K A I V L P L Q R N D D L L S T S S H V L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L R R S G I A A K Q D A T G A P I G R R Y A R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D E I G I P F A V T I D F Q T L E D G S V T I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E R D S M D Q I R V G S K Q L S Q V I A N L S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621
G K V Q W S T V Y K H F P R C E A T N A E
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_gly_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A A S S L P A K L E G F V R T E F E D T C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R R F F Y G L A F D P Y G G T A G L Y D L G P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M C A M K S N M L H F W R Q H F V I E E S M C E
- - - M K S N M L H F W R Q H F . I E E S M C E
---------ATGAAGAGCAACATGCTTCATTTCTGGCGCCAGCACTTC---ATCGAGGAGAGCATGTGCGAG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V D T T C L T P E E V F K A S G H V T R F N D V
V D T T C L T - - - - - - - - - - - - - - - - -
GTGGACACGACCTGCCTCACG---------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M V R D T V T G E C I R A D K F L E E W S E A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E K D G I T A E Q K D E F L H L L H D A A G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N P S Q I K A V L E K H A I K S P K G N P F S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P F P F N L M F A T H I G P E G D R L G Y M R P
- - - - - - - - - - - - - - - - - - - - Y M R P
------------------------------------------------------------TACATGCGCCCC
193194195196197198199200201202203204205206207208209210211212213214215216
E L A Q G I I L N F K R L M D S G N A Q R M P F
E L A Q G I I - - - - - - - - - - - - - - - - F
GAGCTGGCTCAGGGCATCATC------------------------------------------------TTT
217218219220221222223224225226227228229230231232233234235236237238239240
A G A C I G T A F R N E I A P R S A L I R V R E
A G A C I G T A F R N - - - - - - - - - - - R E
GCCGGTGCTTGCATCGGGACCGCCTTCCGTAAC---------------------------------CGCGAG
241242243244245246247248249250251252253254255256257258259260261262263264
F T L A E I E H F V N P N N K N H E K F D R V R
F T L A E I E H F - - - - - - - - - - - - - - -
TTTACGCTGGCGGAGATCGAGCACTTT---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D V E I W A W P R N L Q A S N E D P I R M T I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E A V Q A K V I D N Q T L G Y F I G R V A L F L
- - - - - - - - - - - - L G Y F I G R V A L F L
------------------------------------CTCGGCTACTTCATTGGACGCGTCGCGCTTTTCCTC
313314315316317318319320321322323324325326327328329330331332333334335336
T S V G V R F Y R F R Q H Q S T E M A H Y A Q D
T - - - - - - - - - - - - - - - - - - - - - - -
ACG---------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C W D A E L L T S Y G W I E C V G I A D R S A Y
C W D A E L - - - - - - - E C V G I A D R - - -
TGCTGGGACGCGGAGCTG---------------------GAGTGCGTTGGCATTGCGGACCGC---------
361362363364365366367368369370371372373374375376377378379380381382383384
D L T Q H S N A S K K D L C A R E E Y N E P C M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E R Q L L R Q L T K G L I G K T F G K K A G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M A Y L N S A P A E A C E A I R A A H A A G Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A T V A L P S G E E V S I T A Q M V S F E E K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
V K V T G Y S Y T P S V I E P S F G I G R I L Y
- - - - - - S . . . S V I E P S F G I G R I L Y
------------------AGC---------AGTGTGATCGAGCCGTCCTTCGGCATCGGCCGCATCCTGTAC
481482483484485486487488489490491492493494495496497498499500501502503504
C L L E Q S Y W V R R D D G G K N D K R A V F S
C - - - - - - - - - - - - - - - - - - - - - - -
TGC---------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F S P L L A P Q K V A L L P L M V K P E L L A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I S E I R Q E L V M R G I S V R V D D S S V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G K K Y A R V D E L G I P F A I T C D F E G D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S V T L R E R D T A S Q V R V P K S E V A S I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V E L C N P L Q P L T W D S V K A K Y P A Q A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628
A A E K
- - - -
------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_gly_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K F E T E K L E K I I K S R F L L N Q T A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y G G V S G L Y D I G P V L F G I K Q N F T S
- - - - - - - - - - - - - - - - - I K Q N F T S
---------------------------------------------------AATAGTTACCTTTTTATCAAC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E W R K H F V Y Y D K L Y E V E S S I L L P Y S
E W R K H F . Y Y D K L Y E V E S S I L L - - -
AAGAGAATCATTATCAAA---CACAAAATAAGGAATACCAATTTCATCGCAGGAAGCATATTT---------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L K A S G H V D K F C D I L I C D K N N G L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y R A D H Y I E A F L S K L P H S D E I S Q E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K M V D C M N C K D I D K I I Q K Y N I K T P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G N E F S P S I K F N L M F E T N L G Y K E G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S V F L R P E T A Q G Q F L N F K K L Y E F N N
- - F L R P E T A Q G Q F - - - - - - - - - - -
------ACTATTTTCATTAAAAACAAAATTGATATAAAA---------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K K L P F G S A T I G K A F R N E I S P R S G L
- - - - F G S A T I G K A F R N - - - - - - - -
------------TAACGAATTTAACTCATTAGAAAACTGTTCATAGTC------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I R T R E F E Q A E I E Y F V N P K E K T F K K
- - - R E F E Q A E I E Y F - - - - - - - - - -
---------GATTATAGGCTTCAATTCTTCTTTTATAACCGG------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F K T V N T L V L L L C F D N Q E V K M S L E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V N N K I I N N E I L G Y F M G R T Y L F L A
- - - - - - - - - - - L G Y F M G R T Y L F L A
---------------------------------ATCTTTAGCGTAATGTGCCATCTCATCCTTCTTATGTTG
289290291292293294295296297298299300301302303304305306307308309310311312
N I G I D S T L I R F R Q H K K D E M A H Y A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D C W D C E I Y S S F G W V E C V G I A D R S A
- C W D C E I - - - - - - - E C V G I A D R - -
---GATCTCATTATTGATAAT---------------------TAGAGACATTTTAACTTCTTGATT------
337338339340341342343344345346347348349350351352353354355356357358359360
Y D L T C H S Q A S G T E L C F S E K C I P P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I K E E L K P I I D K K S W I K I L K K D Y E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F S N E L N S L S S K F I Q D N M F K E N D K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y I N F V F N E N S Y K I E C S Q I R T T I H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q K D I P D V I E P S F G I G R I L Y I L L E H
- - - - - D V I E P S F G I G R I L Y I - - - -
---------------AGAAGGAGAAAATTCATTACCATCAGGTGTTTTTATATTGTATTT------------
457458459460461462463464465466467468469470471472473474475476477478479480
S F Y L R E C G R P V L Q L K P K I A S T K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I S Y V V Q N A V F T S Y I N N I L D Q L Y D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
N I V A E V N E R S C S I G K K Y A S C D E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I P Y F V T F D N D S L V D K K V T I R E R D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
M E Q V R L N I S D V S G I I C N L I N E K I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587
W E E L K F N N L K F
- - - - - - - - - - -
---------------------------------
Class II
Eukaryotes/Naegleria gruberi/amino acid sequences/Ngruberi_gly_aa
Eukaryotes/Naegleria gruberi/nucleotide sequences/Ngruberi_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K E I N Q I T K E W N R A N P D K L H I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E E F N E L L T R R F F V I P S F E I Y G G V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G L Y D Y G P P A C A I K A N I L D L W R R H F
- - - - - - - - - - - I K A N I L D L W R R H F
---------------------------------ACCAGCTGTCACACTGTTGTCATCAATAGTGATGGCAAA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V N E E N M L E V D C S S L T P E T V F V A S G
. N E E N M L E V D C S S L T - - - - - - - - -
---AATACCAATATCATCAGCACGAGCATACTTCTTACCAATGTT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H V Q R F A D W M V K D V V T N D C F R A D K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V G E F I D T E L E E N S E L T Q E K T E E Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L V K K K I D D Y D G K G L D E L I Q K Y G I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S P T T G N E L S A S Y P F N L M F S T P I G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T G K L K G Y L R P E T A Q G I F V N F K R L L
- - - - - - Y L R P E T A Q G I F - - - - - - -
------------------CTTATCGATAGATTCAACTCTGAAAGAAATCTT---------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E Y N G K Q M P F A S A Q I G Q A F R N E I S P
- - - - - - - - F A S A Q I G Q A F R N - - - -
------------------------AGTGAGGGAATTCAAATAAGTCATAACTGGTTCGAC------------
241242243244245246247248249250251252253254255256257258259260261262263264
R S G L L R V R E F T L A E I E H F L N P D V D
- - - - - - - R E F T L A E I E H F - - - - - -
---------------------GACTGGTTCGACAGCAACGAATTCTTCAACAGT------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H P K L D T I S S I R V P F F S R E N Q T Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L N P V D L T I A E A M E K G W L T N K T H A Y
- - - - - - - - - - - - - - - - - - - - - H A Y
---------------------------------------------------------------AGCCATTTC
313314315316317318319320321322323324325326327328329330331332333334335336
Y I A R V K L F M D E C G V L P T A I R F R Q H
Y I A R V K L F M D - - - - - - - - - - - - - -
GTTAGCCAAATGTTGACGGAATCTGATAGC------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L A N E M A H Y A R D C W D C E L L T S Y G W I
- - - - - - - - - - - C W D C E L - - - - - - -
---------------------------------CCATCCTTTTTCCATAGC---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E V V G I A N R S C F D L E N H S K Y S K N E L
E V V G I A N R - - - - - - - - - - - - - - - -
TGGGTTCAAACCTTGAGTTTGATT------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V A Y E S F E T P T V E E F V A V E P V K Q K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G K I L K G D V E P V M T Y L N S L T D Q E R L
- - - - - - - - - - - - - Y . . . . . . . . . .
---------------------------------------AAT------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D L Q K Q L D E T G K I S F R V E S I D K T I E
. . . . . . . . . . . . . . . . . S . . . . . .
---------------------------------------------------TGG------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L T K D L I A F P K R E K K I L G R N Y T P G V
. . . . . . . . . . . . . . . . . . . . . . . V
---------------------------------------------------------------------AGT
481482483484485486487488489490491492493494495496497498499500501502503504
I E P S F G I G R I I Y C L L E H S Y W V R P K
I E P S F G I G R I I Y C - - - - - - - - - - -
AGTTGGACTCTTAATACCATATTTTTGGATGAGTTCATC---------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q E H E K E E D K I Q R A V L S L P P A I A P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K V A L L P I K A D Q D Q I V K K L Q Q S L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y G I S H R V D A G N Q N I G K K Y A R A D D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G I P F A I T I D D N S V T A G T V T I R E R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S C E Q V I V P I S D L I T V L N D L I D R I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
L W E D I K Q A Y P E Q K Q T A S D K V G K K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650
V K
- -
------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_gly_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_gly_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N R K T L I E R R E A L E N L L K R R F F I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P S F E I Y G G V A G L F D Y G P P G C A L K S
- - - - - - - - - - - - - - - - - - - - - L K S
---------------------------------------------------------------TTAAAGTCA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E V E S F W R R H F V L A E D M L E I S A T C L
E V E S F W R R H F . L A E D M L E I S A T C L
GAAGTTGAGAGTTTCTGGAGAAGACATTTT---TTAGCTGAAGATATGTTGGAGATTAGTGCAACTTGTTTA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T P Y N P L K A S G H V D R F T D S M I T D I K
T - - - - - - - - - - - - - - - - - - - - - - -
ACT---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T N E Y Y R A D K V L E E Y V E N R L K E K S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N P P K S E E E K N E L E T L G I K A G S M S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D E I K E S L N K Y Q I K P P S G G E W S E P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P F N L M F R T K I G P K E V E G K N D S V G F
- - - - - - - - - - - - - - - - - - - - - - - F
---------------------------------------------------------------------TTT
193194195196197198199200201202203204205206207208209210211212213214215216
M R P E T A Q G I F V N F K R L Y E Y N G K K L
M R P E T A Q G I F - - - - - - - - - - - - - -
ATGAGACCTGAAACCGCACAAGGAATTTTT------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P F S V A Q I G L G F R N E I A P R N G L L R V
- F S V A Q I G L G F R N - - - - - - - - - - -
---TTTTCAGTAGCTCAAATTGGTTTGGGATTTAGAAAT---------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R E F Q M A E I E H F I H P D R K D H P K F D D
R E F Q M A E I E H F - - - - - - - - - - - - -
AGAGAATTCCAGATGGCAGAAATTGAACATTTT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V A L K C L P L Y S S K T Q L N N G E I E R N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T L K E A V H G E E K I I N N E T L A Y F L S R
- - - - - - - - - - - - - - - - - L A Y F L S R
---------------------------------------------------TTAGCTTATTTCTTATCTAGA
313314315316317318319320321322323324325326327328329330331332333334335336
T Y D F L I S I G I N P D G I R F R Q H L S T E
T Y D F L I - - - - - - - - - - - - - - - - - -
ACTTATGATTTTCTTATT------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M A H Y A S D C W D A E V L T S Y G W I E C A G
- - - - - - - C W D A E V - - - - - - - E C A G
---------------------TGCTGGGATGCTGAAGTA---------------------GAATGTGCTGGT
361362363364365366367368369370371372373374375376377378379380381382383384
H A D R S C Y D L L Q H S K A T K T D L F A S E
H A D R - - - - - - - - - - - - - - - - - - - -
CATGCTGATAGA------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K Y D E P Q F K T V L V L T L N K P L I G K T F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K Q E A S L V T E A L Q E I A N K G D I S F Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K L N Q S N K A L L K Y K S C E N G K E Y Q W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I S S E M A K F E F Q T K K V T E E Q F T P G V
- - - - - - - - - - - - - - - - - - - - - P G V
---------------------------------------------------------------CCTGGTGTT
481482483484485486487488489490491492493494495496497498499500501502503504
I E P S F G I G R I I Y C L L E H S F K I R E D
I E P S F G I G R I I Y C - - - - - - - - - - -
ATTGAACCTTCATTTGGAATTGGAAGAATAATATATTGT---------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L S E I Q D Q S T G N K N T N N S P D N E M Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S Y L S L P A L I A P V K C S I L P I S S N A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
F N D L I N L L H K S F I N H G I S C K V D T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
S A S I G R R Y A R T D E I G I P F G I T I D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Q S V K D D T V T L R E R D S M K Q V R I S S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E V P S V I S K I I N Q Q I T W E N V L E N Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656
L F T Q Q S N E
- - - - - - - -
------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_his_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T Q I V L E P L R G F R D I L P P E S R A L S
- - - - - - - - - - - - - - - - - - - - - A L S
---------------------------------------------------------------ATCGCGTAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R L A E I F T E V A E A Y G Y R E V K P P T L E
R L A E I F T E V A E A Y G Y R E V K P P T L E
AACAACTTTCTCTTCTGCAGCCTCTTTTCTCCCTATTATAACAGCATAACGATAACCTTGTTTGGCTAACTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R F Q L F A V K S G E E I R R S M Y V F K D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R E V A L R P E A T A S I A R I Y L K H L R G
- - - - A L R P E A T A S I A - - - - - - - - -
------------TGCGTATCCTGCAAGCGCTTCATCAAGAACTAT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E P K P L R L Y Y V V N C F R Y E E P Q K A R Y
- - - - L R L Y Y V V N C F R Y - - - - - - - -
------------TGACAATCCTAGCTCTTGTATCGCTGCTAGTGTTCT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R E F W Q A G I E L L G E P S I L G D F E V I R
R E F W Q A G I E L L - - - - - - - D F E V I R
CCCTGGCACCTTTTCCCCGCCATAGAGTTCAAT---------------------ACCTGCTATGCTTACAGG
145146147148149150151152153154155156157158159160161162163164165166167168
I L V K F Y E R I E M L D H I V L K I G T T K L
I L V K F Y E - - - - - - - - - - - - - - - - -
GAAACCGGGAACCTTGACTTC---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y R H L F S K Y N I S E D I Q D H I L H L M D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D L Y N E A I N V L L E T D S P E L A D L L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L W S R A R N N I E E A K K I V A K A S E E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G I L E E F N K L I K M L R E Y N N Q L R L D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D L A F A R G L A Y Y T G T I F E V K V P G F P
- - - - - - - - - - - - - - I F E V K V - - - -
------------------------------------------TATGCGTTCATAGAACTT------------
289290291292293294295296297298299300301302303304305306307308309310311312
V S I A G G G R Y D N L I E L Y G G E K V P G T
- S I A G G G R Y - - - - - - - - - - - V P G T
---GACTTCAAAGTCTCCTAGGATCGA---------------------------------GAACTCTCTATA
313314315316317318319320321322323324325326327328329330331332333334335336
G F A I G L D R T L A A I Q E L G L S P K L V Y
G F A I G L D R T L A A - - - - - - - - - - - -
TCTCGCCTTCTGTGGCTCTTCATACCTGAAACAGTT------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E D K V P I A I I V L D E A L A G Y A A R V Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I L A A K S T V T T S M Y V S P K L Q K I L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L A K Q G Y R Y A V I I G R K E A A E E K V V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430
R D L L Q R R Q D I V S L D E L S N V E F K
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_his_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E I E K F I F E T A S S V A E S Y G F K R I D
- - I E K F I F E T A S S V A E S Y G F K R I D
------GCTTGTGCTCTTTTCAAGGAATGGAACTAAATCGCCTAGTGTTACAATTTCCTGTTCTCCAGTCGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F P S L E Y I D L Y R I K S G E E L L N Q T Y S
F P S L E - - - - - - - - - - - - - - - - - - -
GAGATCTCTTACTGT---------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F T D R G G R E V T L I P E A T P S T V R M L T
- - - - - - - - - T L I P E A T P S T V - - - -
---------------------------AAGCGACCTATCCATTATCTCTGCAGATACAAT------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S R K D I A K P V R W Y S F P K V W R Y E E P Q
- - - - - - - - V R W Y S F P K V W R Y - - - -
------------------------AATCCTCTCCGCTTTCACTGTTCCAACCCTGCATAC------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A G R F R E H Y Q F N A D I F G P S N E E A D A
- - - - R E H Y Q F N A D I F - - - - - - - D A
------------TGCCTTCACACCCTTGCTCTTAAGGAGCAGCGA---------------------AAATCC
121122123124125126127128129130131132133134135136137138139140141142143144
E I I S L A S G I L D G L G L S G A Y E I R V N
E I I S L A S G I L D - - - - - - - - - - - - -
AACTGCAGGTATGTCTTGTTCTGAAAATAGCTT---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S R I M M E D I L N G M G I A D P Y T V F S I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D R F H K V S K E T F V D D L M S V G L S E E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S N T I Y R M C S E A S E P G G I S G L F G S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K V S K A A E R L I R T I D I L K E Y G V K S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K Y D F S I V R G L S Y Y T G L V F E A Y D K S
- - - - - - - - - - - - - - - - V F E A Y D - -
------------------------------------------------GCCGTTCAATATGTCTTC------
265266267268269270271272273274275276277278279280281282283284285286287288
G Q F R A I L G G G R Y D N L A K L F S E Q D I
- - - - A I L G G G R Y - - - - - - - - - - - I
------------AACTCTTATTTCGTACGCTCCGGA---------------------------------GGA
289290291292293294295296297298299300301302303304305306307308309310311312
P A V G F G M G D A V I S L L L K S K G V K A P
P A V G F G M G D A V I S L L - - - - - - - - -
GATTATCTCAGCGTCAGCTTCCTCATTGCTTGGGCCGAAAATATC---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H A K K S V Y V C R V G T V K A E R I A S I S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
M L R S S G F I V S A E I M D R S L S S Q L K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A S Y E G C E Y A V I A G E R D L E N N S V T V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R D L S T G E Q E I V T L G D L V P F L E K S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410
S Y
- -
------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_his_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F N R P K G T R D F A P S E M K K R K I I E N
- - - - - - - - - - - - - - - - - K R K I I E N
---------------------------------------------------AAAAGAAAAATAATTGAAAAT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K L K S V F M A Y N F N E I N T P T F E Y F E L
K L K S V F M A Y N F N E I N T P T F E - - - -
AAATTAAAAAGCGTATTTATGGCATATAATTTCAATGAGATAAACACCCCCACATTTGAA------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L S K K T G E D I R K Q L F V F K D H G N R E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G L R P E I T S S V V R F Y I N E L K N L P K P
G L R P E I T S S V V - - - - - - - - - - - - -
GGACTTAGACCAGAAATAACCTCCTCAGTGGTT---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q K L F Y F A N C F R Y E Q P Q A G R Y R E F W
Q K L F Y F A N C F R Y - - - - - - - - R E F W
CAAAAATTATTTTATTTTGCCAACTGTTTTAGGTAT------------------------AGGGAATTTTGG
121122123124125126127128129130131132133134135136137138139140141142143144
Q M G C E L L G S K N P I A D A E V I N L A M D
Q M G C E L L - - - - - - - D A E V I N L A M D
CAAATGGGATGCGAGTTATTG---------------------GATGCAGAAGTTATAAATTTAGCTATGGAC
145146147148149150151152153154155156157158159160161162163164165166167168
G L N K I N M D Y E I H I G H L G V L K G V F E
G L N - - - - - - - - - - - - - - - - - - - - -
GGATTGAAT---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E F G L T E D E E L K I R R L I D K E D Y E N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E K C L I E L E E N K N I I I K D I I F S V L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S K G T V E E V I G N L K E I L K N Y P K S I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A L N N L E E I M E F V K R N N Y I I N L G I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R G L D Y Y T G M V F E V Y G K K E G A R Q V C
- - - - - - - - - V F E V Y G - - - - - - Q V C
---------------------------GTATTTGAAGTATATGGT------------------CAGGTATGC
289290291292293294295296297298299300301302303304305306307308309310311312
G G G R Y D N L I E L F E G A P T P A V G F A Y
G G G R Y - - - - - - - - - - - T P A V G F A Y
GGTGGCGGTAGATAT---------------------------------ACGCCTGCGGTAGGTTTTGCCTAC
313314315316317318319320321322323324325326327328329330331332333334335336
G F D R I M L N I D D F E V E D K R I L I V P I
G F D R I M L N - - - - - - - - - - - - - - - -
GGATTTGATAGAATTATGTTAAAT------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K K D K K L L K E C L I I A D K L R E M E K I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E V D L M N R K L N K A L N Y A N T V G I S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I M I G E K E L N E R K I S I K D M E T G E Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418
L I D L E E L S N I
- - - - - - - - - -
------------------------------
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_his_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E F E P I R G M K D Y Y G E E L N K I K F I
- - - - - - - - - - - - - - - - - - - K I K F I
---------------------------------------------------------CTCTCTTTTTTTAAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E E T F R S V V L N S G Y Q E V Y T P I V E D F
E E T F R S V V L N S G Y Q E V Y T P I V E - -
GAACTTAATGGTAATACTATTTTCTTCCAATTCCTTCTTACCTATCAATGCAATTGCGTCATATCC------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K L F S L K S G E E I R K T M Y V F K D K A D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V A L R P E I T P S I V R V Y L N S M Q H L P
- - A L R P E I T P S I V - - - - - - - - - - -
------ATTCAGTAACCTTATCGCTAAACTTAAGCTATC---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K P L R L F Y V G Q V Y R Y D E P Q F G R Y R E
- - L R L F Y V G Q V Y R Y - - - - - - - - R E
------TTGTAGATCAGATTTAATTTTGTTTATAACTAATGC------------------------TCCGAT
121122123124125126127128129130131132133134135136137138139140141142143144
F R Q A G V E L L A S S S S F A D I E V I S L L
F R Q A G V E L L - - - - - - - D I E V I S L L
TGCCGGAGTATCAGTTCCACCGTACAA---------------------TCCTCCGCCAGCTATACTAAAACT
145146147148149150151152153154155156157158159160161162163164165166167168
N E I Y D S L G L K D K I I I K I N N I G I Y R
N E I Y D - - - - - - - - - - - - - - - - - - -
TACATCAGGGTGAAC---------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E I F N K A G I S E E Q Q E H L L H L I D K G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V D D A L K E F T D N N Y K D L I T Y L I S L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F D K I E P D K L E S L R K E I S K Y N F N L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G E I N K L S F I C E V L E D L G V K I K I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G F V R G L A Y Y T G V I F E V V H P D V S F S
- - - - - - - - - - - - I F E V V H - - - - - S
------------------------------------AAGCCCTAGTGAATCATA---------------ACT
289290291292293294295296297298299300301302303304305306307308309310311312
I A G G G R Y D N L V R L Y G G T D T P A I G F
I A G G G R Y - - - - - - - - - - - T P A I G F
GATAACCTCGATGTCTGCAAA---------------------------------TTGTCTAAATTCCCTGTA
313314315316317318319320321322323324325326327328329330331332333334335336
A I G V E R T A L V I N K I K S D L Q R K K I A
A I G V E R T A L V - - - - - - - - - - - - - -
ACGACCGAATTGTGGTTCATCATATCTATA------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I P L I S T K D S L S L A I R L L N I L R K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N I I G V L N L K D V P L S K L M I Y Y V E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y D A I A L I G K K E L E E N S I T I K F L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428
R E Q K T V K L E K I E D V L I N N L S
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_his_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G V T L M K V E R P K G T R D F T P E E M R A
- - - - - - - - - - - - - - - - - - - - - - - A
---------------------------------------------------------------------CAC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R R W L E R Y L L D V F R S Y G Y E E V L T P T
R R W L E R Y L L D V F R S Y G Y E E V L T P T
CGACACGTATCCCTCCTTCAGCTCCCGCTCCCCTACGATCACGGCGTAGTCGTACTCGAGCGAGTCCGCCAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F E H A K L F E E K S G E E I L E E M Y V F K D
F E - - - - - - - - - - - - - - - - - - - - - -
TGAGAG------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K K G R K L A L R P E M T A P V V R F Y N A E L
- - - - - - A L R P E M T A P V V - - - - - - -
------------------ACCCGACCTCACGAGCGGTATCAGCAAGGCACG---------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K T R P H P L K L A Y I V N C F R Y E Q P Q R G
- - - - - - L K L A Y I V N C F R Y - - - - - -
------------------GGCCGCGAGGAGGAGCCTGTCGAAACCTATGGCCAT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R W R E F W Q A G V E V F G S D R P E A D V E V
- - R E F W Q A G V E V F - - - - - - - D V E V
------TCCGAGCTCCTTCACCAGGTCGTCGTAGCGGCC---------------------TCCACCGAGCTC
145146147148149150151152153154155156157158159160161162163164165166167168
I E L T Y R I F D G I L P S G A F E V R V G H L
I E L T Y R I F D - - - - - - - - - - - - - - -
CGGCACGTGTATTTCGAACACCATCCC---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G I L R G L L E E Y G I G E D V Q N K V A H L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D K G E L D E V K T L L P A E P A E K A L A V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T A R S E S E V E E A V S G K E R A E R A L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L M E I S D A L R E A G V D H E L D F S V A R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L D Y Y T G M V F E I H V P E L G G G S Q C A G
- - - - - - - V F E I H V - - - - - - - Q C A G
---------------------GATCCGGTAGGTCAGCTC---------------------CGGGCGGTCCGA
289290291292293294295296297298299300301302303304305306307308309310311312
G G R Y D D L V K E L G G P D V P A V G M A I G
G G R Y - - - - - - - - - - - V P A V G M A I G
GCCGAACACCTC---------------------------------CCGCTGCGGCTGCTCGTACCGGAAGCA
313314315316317318319320321322323324325326327328329330331332333334335336
F D R L L L A A E L Y D R I P D G V E E T R A L
F D R L L L A - - - - - - - - - - - - - - - - -
GTTCACGATGTACGCCAGCTT---------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L I P L V R S G K I W E I A A K L R K L G W V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N V E V S G K H I R K A L S L A D S L E Y D Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V I V G E R E L K E G Y V S V K N L K T G V Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421
E V P L D Q L E R A A E V
- - - - - - - - - - - - -
---------------------------------------
Class II
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_his_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Y D R L K G F R D F Y P D E M G P R R V A I D
- - - - - - - - - - - - - - - - - P R R V A I D
---------------------------------------------------GAACGGCGCGGTCACCTGGTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L E G A A R Q Y G F R E I G T P A L E G Q Q M
A L E G A A R Q Y G F R E I G T P A L E - - - -
GCCGCTCTCCATGTGCTTGACCGTCACCTCGCCGTTCGCGAGGTCCTGCTCGCCCACGAT------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y V D K S G E G I V E E L Y T F T D Q G G R D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L T P E L T P T V A R M V V A K Q Q E L Q K P
A L T P E L T P T V A - - - - - - - - - - - - -
GCCGCGGTCCCGGAGGTCACCCGCGACGCGCGC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I K W F S T R P F W R Y E E P Q Q G R F R E F Y
I K W F S T R P F W R Y - - - - - - - - R E F Y
GTCGGCGGTGAACTCGCCCTCCGGGAGCACGCCCGC------------------------GGCGTGGCCGGG
121122123124125126127128129130131132133134135136137138139140141142143144
Q T N V D I F G S S D P R A D A E V L A V V A D
Q T N V D I F - - - - - - - D A E V L A V V A D
CGCGACCCCGACCGCGGGCGT---------------------GATGAGGCCGTCGTAGCGCCCGCCGCCGAA
145146147148149150151152153154155156157158159160161162163164165166167168
G L T D L G L T S E D F E F R V S H R D I L G G
G L T - - - - - - - - - - - - - - - - - - - - -
CACCGACCG---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L E A F D A D V D T E E A I R T V D K R E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E F A E Y V D G L E A A G L T R E Q A E R F D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L L A G D D L D A L V E F A G T E R V D D A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N L R N V L Q A A E N L G V R E Y C D V S L T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A R G L D Y Y T G V V F E C F D A T G E V G R S
- - - - - - - - - - V F E C F D - - - - - - - S
------------------------------GCGGAACTCGAAGTCCTC---------------------GAG
289290291292293294295296297298299300301302303304305306307308309310311312
V F G G G R Y D G L I E S F G G Q P T P A V G V
V F G G G R Y - - - - - - - - - - - T P A V G V
GCCGTCCGCGACTACCGCCAG---------------------------------GAAGATGTCGACGTTCGT
313314315316317318319320321322323324325326327328329330331332333334335336
A P G H A T L G L L L E N A G V L P E G E F T A
A P G H A T L G L L - - - - - - - - - - - - - -
CTGGTAGAACTCCCGGAACCGGCCCTGCTG------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D Y Y V L Q V G D T E A E A A R V A G D L R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G N V V D T D V T G R S F G A Q M N Y A D G I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A E T V V I V G E Q D L A N G E V T V K H M E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G D Q V T A P F D E F P G E L D A P T V D D Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_his_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I Q K P R G T R D M L P D E M E R R R E I E A
- - - - - - - - - - - - - - - - - R R R E I E A
---------------------------------------------------CGGCGTCGTGAGATAGAAGCA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R M R A R A R L Y G F R E I A T P V F E E L E L
R M R A R A R L Y G F R E I A T P V F E - - - -
CGGATGCGGGCACGGGCACGACTCTATGGTTTTCGGGAGATAGCAACCCCGGTATTTGAA------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F T I R S G E G I I N E M Y V F E D K G G R S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L R P E L T A P V L R M Y V E E G R S L N K P
A L R P E L T A P V L - - - - - - - - - - - - -
GCACTCAGGCCGGAACTGACCGCACCGGTTCTC---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V K W C Y F A D C F R Y E R P Q K G R Y R Q F W
V K W C Y F A D C F R Y - - - - - - - - R Q F W
GTCAAATGGTGCTATTTTGCCGACTGTTTCAGATAT------------------------CGCCAGTTCTGG
121122123124125126127128129130131132133134135136137138139140141142143144
Q F G A E L I G A D S A M G D A E V I T L G Y D
Q F G A E L I - - - - - - - D A E V I T L G Y D
CAGTTCGGGGCAGAACTTATC---------------------GATGCGGAGGTTATCACACTCGGATATGAC
145146147148149150151152153154155156157158159160161162163164165166167168
L L R T A G V T F V L R I G H L S F M R T L L A
L L R - - - - - - - - - - - - - - - - - - - - -
CTTCTCAGG---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L A D G D K K K I R A F L D K R E E E A A I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y L R D I G R D D L C D P L I R L C G A R T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D V F A I I G E I P E A A R V R E M F A I L D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S G I P Y E I N P A I A R G L D Y Y T G V V F E
- - - - - - - - - - - - - - - - - - - - - V F E
---------------------------------------------------------------GTCTTTGAA
265266267268269270271272273274275276277278279280281282283284285286287288
C F A E G L G A E N Q I L G G G A Y R L A H L F
C F A - - - - - - - Q I L G G G A Y - - - - - -
TGCTTTGCC---------------------CAGATCCTTGGTGGTGGTGCATAC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G G E D T P S A G F A I G F D R V M V A L G E A
- - - - T P S A G F A I G F D R V M V A - - - -
------------ACTCCATCGGCCGGATTTGCCATCGGTTTTGACCGGGTAATGGTTGCC------------
313314315316317318319320321322323324325326327328329330331332333334335336
S W V P W Q P Q V M I I T T N E G R D Y A L T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A G Q F R M N G I I T E T D L M D R S F S A Q M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K A A G K S A D Y A V I I G K D E V E T G T I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L K D L K A G T Q E K I T A D E A I Q K L T S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/his_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K I E R P R G T R D F L P D E M E R R R E I E
- - - - - - - - - - - - - - - - - - R R R E I E
------------------------------------------------------TTCGAGGTTCTTTATCGC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K R M R K I A E S F G Y R E V A T P T F E Y L E
K R M R K I A E S F G Y R E V A T P T F E - - -
AACTCTCCCACTCTTAACCTCATCCGGGCCGAGTATGACCGCATACTTTACCCCCATTTCGCT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F T R K S G E G I I E E M Y V F K D K S G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L A L R P E L T A P V M R M F V N E C S V M P K
- A L R P E L T A P V M - - - - - - - - - - - -
---CCTGAAGGCCTGGCTTTCCAGCCCCTTAAAGGA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P L R F Y Y F A N C F R Y E R P Q K G R Y R E F
- L R F Y Y F A N C F R Y - - - - - - - - R E F
---GCAAGCCTCACAAACCCTGTCAAAGCCTATAGCGAA------------------------GCCGAAAAG
121122123124125126127128129130131132133134135136137138139140141142143144
W Q F G V E L I G S E S Y L A D A E V I I L A D
W Q F G V E L I - - - - - - - D A E V I I L A D
TGAGGAAAGCTCGTAGCTCCCTCC---------------------TCCGAGCCCTTCAGCGTAGCACTCAAA
145146147148149150151152153154155156157158159160161162163164165166167168
K I L K D V G V N F S L E I G H V G I M R H L L
K I L K - - - - - - - - - - - - - - - - - - - -
TACGACGCCCGT------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K P I G E D R A S K V M R L I D K G D R E G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S Y L A E I R V N E D L R D K I F S L L E L K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D E S V I E E A K E I I D Y D F G H L E S L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L L R D V G V D F T L N L G I A R G L D Y Y T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V V F E C Y A E G L G A Q K Q V C G G G S Y E L
- V F E C Y A - - - - - - - Q V C G G G S Y - -
---TTTATCTGCAAGGATTAT---------------------CGATTCAGAACCAATCAGCTCAAC------
289290291292293294295296297298299300301302303304305306307308309310311312
S S L F G G P V T P S T G F A I G F D R V C E A
- - - - - - - - T P S T G F A I G F D R V C E A
------------------------CTTCTGCGGCCTCTCGTAGCGGAAGCAGTTTGCGAAGTAGTAAAAGCG
313314315316317318319320321322323324325326327328329330331332333334335336
C S V E A G E K S V V A V V S F K G L E S Q A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V A S M L R E R G F T A V V D V M G R N L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q M S F A S E M G V K Y A V I L G P D E V K S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R V A I K N L E T Q E Q V V V A E E E L F S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409
Q
-
---
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_his_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I S R P R G T R D F L F A E M R N R K E V E
- - - - - - - - - - - - - - - - - - N R K E V E
------------------------------------------------------AACAGGAAAGAGGTTGAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G V L R R T F E T Y G Y H E I K T P I F E E L K
G V L R R T F E T Y G Y H E I K T P I F E - - -
GGTGTACTCAGAAGGACATTCGAGACCTATGGCTACCATGAGATCAAGACACCAATATTTGAG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F T V K S G E E V V N Q I Y H F T D K G G R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L A L R P E L T A P V A R L Y M N E M Q K K P K
- A L R P E L T A P V A - - - - - - - - - - - -
---GCCCTGAGACCTGAACTCACAGCACCCGTGGCA------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P I K M Y Y F G S C F R Y E R P Q A G R F R Q F
- I K M Y Y F G S C F R Y - - - - - - - - R Q F
---ATAAAGATGTACTACTTCGGGAGCTGCTTCAGGTAT------------------------AGACAGTTC
121122123124125126127128129130131132133134135136137138139140141142143144
W Q F G C E L I G G R S P L A E A E V I S L A S
W Q F G C E L I - - - - - - - E A E V I S L A S
TGGCAGTTCGGATGCGAACTCATA---------------------GAGGCTGAGGTGATATCCCTAGCATCT
145146147148149150151152153154155156157158159160161162163164165166167168
E S L H E L G L D G F E V H I G H L G I L R G I
E S L H - - - - - - - - - - - - - - - - - - - -
GAATCCCTCCAT------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G R E E I P S E L Q D R I M G V I D K G D V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L E A L L G E V E V S G E S R E L L M K L I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T Q G G P E V L D D V E E Y L G G Y S E S L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L E E F R E L V E T L H Y F G V D D Y H V N L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I A R G L D Y Y T G I V F E I Y V P E L G A Q K
- - - - - - - - - - - V F E I Y V - - - - - - -
---------------------------------GTATTCGAGATCTACGTG---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q I C G G G T Y N L V E T F G G E R V E S T G F
Q I C G G G T Y - - - - - - - - - - V E S T G F
CAGATATGTGGCGGAGGGACCTAC------------------------------GTCGAATCAACGGGATTC
313314315316317318319320321322323324325326327328329330331332333334335336
A F G F D R L M N A L G M D E E N M R M V D V F
A F G F D R L M N A - - - - - - - - - - - - - -
GCCTTCGGCTTTGACAGGCTCATGAACGCC------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V I P I Q D S T V P E A I R I T Q E L R A A G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S A D L E V S G R K L R K A L S H A D N L G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F A V L T G E R E I Q D G K V T V K D M E R N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425
Q E T L P R D E M V D K I K G R C
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_his_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S G L P D H L R R P V R G M R D W L P P Q Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L R H M E E V L C K V A E S F G Y R R V E T P
A L R H M E E V L C K V A E S F G Y R R V E T P
CTTTTCTAACTCCTTTCGGCCAATAATTATTATGTGTCTAGCCCCGACTTTTAACGCGTATTCAAAGGCGTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V V E H F E V L A K K A G Q D V I N E I Y Y F K
V V E - - - - - - - - - - - - - - - - - - - - -
TTTTAGACC---------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D K A G R D L G L R F D M T V P V A R V L S Y N
- - - - - - - G L R F D M T V P V A - - - - - -
---------------------ATCAAAAATATATATGTAGTAGTCCAGCGGCCT------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E L P R P V R W Y Y F T K V F R Y D E P Q H G
- - - - - - V R W Y Y F T K V F R Y - - - - - -
------------------CTCTACGCCTATGGCAAATCCCAGCGCCGGGGTTTT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R Y R E F Y Q F G V E L V G S S S P R A D A E V
- - R E F Y Q F G V E L V - - - - - - - D A E V
------ATCGTCGTAACGCCCGCCGCCGCCGACGGCGAG---------------------CTCGAAGACTAT
145146147148149150151152153154155156157158159160161162163164165166167168
I Q L L I A S L E A A G A S N F Y V R I N D R R
I Q L L I A S L E - - - - - - - - - - - - - - -
TCCAGTGTAGTAATCCAGCCCCCTTAC---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A V D K L L E H L G V A P Y R D I I Y K A L D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K L K L P R E D V I K I M T G G G V S K E I A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E I Y N T A T E I T I Q E A V E L L Y K L D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L G A S Y E K I V K Y L E A S V P M E R L K F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
M S I V R G L D Y Y T G I V F E A F V G E Y K L
- - - - - - - - - - - - - V F E A F V - - - - -
---------------------------------------CTCGGCGTCGGCCCTGGG---------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V G G G G R Y D D L L E L Y S G V K T P A L G
A V G G G G R Y - - - - - - - - - - - T P A L G
TAGCTCCACGCCGAATTGGTAAAA---------------------------------TCTAAAGACTTTTGT
313314315316317318319320321322323324325326327328329330331332333334335336
F A I G V E R L M E A V G I Q N V E R P L D Y Y
F A I G V E R L M E A - - - - - - - - - - - - -
GAAGTAGTACCAACGCACTGGCCTTGGCAGTTC---------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I Y I F D D D A Y K Y A A A V A K K L R T E G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S V V V E L G E K G L K D A F E Y A L K V G A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
H I I I I G R K E L E K G V I K V R D L E K R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419
E V E K P L S Q F L A
- - - - - - - - - - -
---------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_his_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I L P P R G T K D F T P E L A I L W K E I V S
- - - - - - - - - - - - - - - - - L W K E I V S
---------------------------------------------------TCTTTCCCTTGTTAGCCTATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K I E S V Y Q K Y G F D P I I T P I V E Y W D T
K I E S V Y Q K Y G F D P I I T P I V E - - - -
TTGAAATGTTACTAAATTATTGGCTAAATCCTTTTTACCAACAATAACTAAATACCTAAT------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L K G K Y G E E A E K K E I W R F R V P Q S K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
W Y A L K Y D Q T V P L A R Y F A R F R P K L P
- - A L K Y D Q T V P L A - - - - - - - - - - -
------GGCAATTCTCCATGCTTCTTTGAAAACCTCTAT---------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F K R Y T I D R T F R Y D E P Q K G R Y R E F W
F K R Y T I D R T F R Y - - - - - - - - R E F W
GTTTAGATTAAATATACCTTTTTCTAAACCAACATC------------------------CCCTCCAACGGC
121122123124125126127128129130131132133134135136137138139140141142143144
Q A D A D I V G S P Y P E A D A E I L N M M I E
Q A D A D I V - - - - - - - D A E I L N M M I E
AGGAATTTTTTCTTTAGAAAA---------------------CCTACCACCTCCGCCCAGGGCTCTATTAAA
145146147148149150151152153154155156157158159160161162163164165166167168
A Y E T L G F N V Y L R V S D R R A L E S L I E
A Y E - - - - - - - - - - - - - - - - - - - - -
ACCTTCAAT---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K V G E K D K F I E I A R I I D K W D K I G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G V L E K L K Q I T D K A E K I I E L L K E N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E E F Y P K E F W E I I D L V E K K N K I K I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I K L A R G F D Y Y T G M V Y E V W I E G F N R
- - - - - - - - - - - - - V Y E V W I - - - - -
---------------------------------------ATTAAATCCTAAAGTTTC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
A L G G G G R Y D N L I G I F S K E K I P A V G
A L G G G G R Y - - - - - - - - - - - I P A V G
CATATTTAATATCTCTGCATCCGC---------------------------------GGCTTGCCAAAACTC
289290291292293294295296297298299300301302303304305306307308309310311312
G S I G I N P L I D V G L E K G I F N L N K K T
G S I G I N P L I . V G - - - - - - - - - - - -
TCTATATCTTCCTTTTTGTGGTTCATC---TCTAAA------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y T Q I A V I Y I E V F K E A W R I A N K L R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G L N V Y I D L L R R D F K K Q M E Y V I E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D I R Y L V I V G K K D L A N N L V T F Q D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404
T R E R K K I P I E N L E E I K S L V Q
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_his_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T V N R P R G T R D F L P A D T A R R R Y V E
- - - - - - - - - - - - - - - - - - R R R Y V E
------------------------------------------------------CGGAGAAGGTACGTGGAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V M R N V V R N W G Y S E I I T P T F E H L D
S V M R N V V R N W G Y S E I I T P T F E - - -
AGCGTTATGCGAAATGTTGTCCGCAACTGGGGATACAGTGAAATCATTACGCCTACATTTGAA---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F T L K S G E G I V G E L Y N F T D K G G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M T L R P E L T A P V M R L Y V N E L Q P F P K
- T L R P E L T A P V M - - - - - - - - - - - -
---ACCCTCAGGCCGGAACTTACGGCTCCTGTCATG------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P L K L F Y F E N C F R Y E R P Q K G R F R E F
- L K L F Y F E N C F R Y - - - - - - - - R E F
---TTGAAGTTATTCTACTTTGAAAATTGTTTCCGCTAC------------------------AGAGAATTC
121122123124125126127128129130131132133134135136137138139140141142143144
W Q F G V E L I G S G K S D S D A E V I A L A D
W Q F G V E L I - - - - - - - D A E V I A L A D
TGGCAGTTCGGAGTCGAACTCATC---------------------GACGCCGAGGTTATTGCCCTTGCCGAT
145146147148149150151152153154155156157158159160161162163164165166167168
A L L K A V G I Q G D M K L G N L A V I R T L L
A L L K - - - - - - - - - - - - - - - - - - - -
GCCCTGTTAAAA------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G L E P E I V S K V M R L V D K K E Y A G L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S L L E E I G A E E Q L K S D L F H L I H L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K Y I L P K V K E I V G N I P E L V G F E K T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K L L D A Y G V D Y S L D F G I A R G L D Y Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G M V F E V Y A E G L G A Q K Q V C G G G S Y Q
- - V F E V Y A - - - - - - - Q V C G G G S Y -
------GTCTTTGAGGTTTATGCC---------------------CAGGTCTGCGGGGGTGGCTCTTAC---
289290291292293294295296297298299300301302303304305306307308309310311312
L I Q L F G G G D V P S T G F G I G F D R I M E
- - - - - - - - - V P S T G F G I G F D R I M E
---------------------------GTGCCTTCCACGGGCTTCGGAATAGGTTTTGACAGGATTATGGAG
313314315316317318319320321322323324325326327328329330331332333334335336
I C P L V P P A S K N L V L V S K P A T H I E A
I - - - - - - - - - - - - - - - - - - - - - - -
ATC---------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K V A S E L R N Y L P V Q I D L M E R N F K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q F S Y A N T I N A D Y V V I V G E K E L E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K L T L R D M V S G E Q E L L T L E E I I E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413
T G Q Q D
- - - - -
---------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_his_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I E R V K G T R D F L P E D M A K R R W V F E
- - - - - - - - - - - - - - - - - K R R W V F E
---------------------------------------------------GTTATATTGCTCTCCACTTTC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K I R E V F E A Y G F K E I L T P V M E Y T K L
K I R E V F E A Y G F K E I L T P V M E - - - -
CATATCCCTTATTGTTACAACCCCTCTCTCAACATCTCTCTTCCCAACTATTATGACTAA------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F Q L R S G E E V V K Q L Y A F K D K G G R D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S L R P D M T S S V A R L Y V N S F Q M A P K P
S L R P D M T S S V A - - - - - - - - - - - - -
CCTTAACTTTACTGCTATATTAATTGCAACTTT---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I K W Y Y I A N M F R Y E E P Q S G R Y R E F W
I K W Y Y I A N M F R Y - - - - - - - - R E F W
AGTTTGAGGTTTGGGAATTAAACCTTTCCATTCCAG------------------------AATTGCGAATCC
121122123124125126127128129130131132133134135136137138139140141142143144
Q A G V E L I G S D K V E A D A E V I A L F V E
Q A G V E L I - - - - - - - D A E V I A L F V E
AGTGGCCGGTGTTGGCTTTCC---------------------ATCGTACCTCCCCCCTCCCCCTATGGATCC
145146147148149150151152153154155156157158159160161162163164165166167168
S Y L S T G L R D F T V N I G D R I L L D E F A
S Y L - - - - - - - - - - - - - - - - - - - - -
TATCCCAAG---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G M L G V S D D I G L M R I I D K R D K L S Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E F I N L L K E F G L G E S E I E K V L E L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I K G R P D N V L P L A E E L F K S K K A K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I S K L Y K L T D L L E W Y G V K D W I R I D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I A R G F D Y Y T S I V F E A I S P N E L G I
- - - - - - - - - - - - V F E A I S - - - - - -
------------------------------------AACCGTAAAATCTCTGAG------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G S I G G G G R Y D N L I E I F G G K P T P A T
- S I G G G G R Y - - - - - - - - - - - T P A T
---AACGAATAATGCTATAACCTCTGC---------------------------------AACTCCGGCCTG
313314315316317318319320321322323324325326327328329330331332333334335336
G F A I G I E R L L P I L E W K G L I P K P Q T
G F A I G I E R L L . I L - - - - - - - - - - -
CCAAAATTCCCTGTAACGACCACTTTGAGG---TTCGTA---------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G P E V F V I P L K D M E K V A I N I A V K L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R E K I K T D I E L S G R K L G K A L D Y A N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V G A K L V I I V G K R D V E R G V V T I R D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431
E S G E Q Y N V S L N E I V D K V K N L L K R
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_his_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S L E P T F R N I R G T F D I L P Q D G R S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G T H D M P S R A W Q H V E Q V V R E V L E R F
- - - - - - - - A W Q H V E Q V V R E V L E R F
------------------------GCCTGGCAGCACGTCGAACAGGTCGTCCGGGAGGTGCTCGAACGCTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N F R E I R T P I L E P T E L I A R G V G Q L T
N F R E I R T P I L E - - - - - - - - - - - - -
AACTTCCGGGAGATTCGCACGCCGATTCTGGAA---------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D I V T K E M F A F R R G D T N Y V L R P E V T
- - - - - - - - - - - - - - - - - V L R P E V T
---------------------------------------------------GTGCTGCGCCCCGAGGTGACG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A P V M R A Y L Q H R L D Q Q G A V Q K L Y Y I
A P V M - - - - - - - - - - - - - - Q K L Y Y I
GCGCCGGTCATG------------------------------------------CAGAAGCTCTACTACATC
121122123124125126127128129130131132133134135136137138139140141142143144
G P C F R A E N P Q K G R Y R Q F H Q F G V E L
G P C F R A - - - - - - - - R Q F H Q F G V E L
GGCCCCTGCTTCCGGGCC------------------------CGGCAGTTCCACCAGTTCGGCGTCGAGCTG
145146147148149150151152153154155156157158159160161162163164165166167168
I G A E T P E A D A E V I A A M M A V Y E A F G
I - - - - - - - D A E V I A A M M A V Y E - - -
ATC---------------------GACGCCGAGGTGATCGCGGCCATGATGGCCGTCTACGAG---------
169170171172173174175176177178179180181182183184185186187188189190191192
L K N L R L R I N T L G D A E S R P R Y R E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R A Y L Q P L A D R L T P T S R Q R L E T N P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R I L D T K D E R E R R L L E G A P R I I D F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E K G R A H Y E A V K A H L Q A L G I A F E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D P F L V R G L D Y Y T H T T F E L E S P D L G
- - - - - - - - - - - - - - T F E L E S - - - -
------------------------------------------ACGTTCGAGCTGGAGAGC------------
289290291292293294295296297298299300301302303304305306307308309310311312
A Q S A L A G G G R Y D L L A M D L G H D A P V
- - - A L A G G G R Y - - - - - - - - - - - - V
---------GCGCTGGCCGGCGGCGGACGCTAC------------------------------------GTG
313314315316317318319320321322323324325326327328329330331332333334335336
P A V G F A A G I E R L F I A L Q A Q G Y A F P
P A V G F A A G I E R L F I A - - - - - - - - -
CCGGCCGTGGGCTTTGCGGCGGGTATCGAGCGGCTGTTCATCGCG---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E E P P L D A Y L V S L G E A A M R R A L V E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q A L R R A G L R V D L D L K G R S M K A Q M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E A N R Q Q A R Y A V I M G D R E L A E G R A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V R D M Q S G Q Q Q E V P L D E L A D F L K G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436
V R V S
- - - -
------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_his_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I V M F Q K P R G T R D F L P E E M K K R R F
- - - - - - - - - - - - - - - - - - - - K R R F
------------------------------------------------------------AAAAGAAGATTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V E N K L R E V F E R Y G Y K E I L T P T F E S
V E N K L R E V F E R Y G Y K E I L T P T F E -
GTTGAAAATAAGCTAAGAGAGGTTTTTGAGAGGTATGGGTATAAGGAGATATTAACCCCAACCTTTGAA---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F E L I A K K T G E E I R K Q L Y V F K D H G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R E M A L R P E M T S P V V R F Y L N E L K N L
- - - A L R P E M T S P V V - - - - - - - - - -
---------GCTTTAAGACCAGAGATGACATCCCCGGTTGTT------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q K P L R L Y Y F A N C F R Y E R P Q A G R F R
- - - L R L Y Y F A N C F R Y - - - - - - - - R
---------TTAAGGCTTTATTATTTCGCTAATTGTTTTAGATAT------------------------AGA
121122123124125126127128129130131132133134135136137138139140141142143144
E F W Q M G C E L I G C K E P L A D A E V L N L
E F W Q M G C E L I - - - - - - - D A E V L N L
GAGTTTTGGCAGATGGGTTGTGAGTTAATA---------------------GATGCTGAGGTTTTGAATTTA
145146147148149150151152153154155156157158159160161162163164165166167168
A M D G L I N I G L D F D V H I G H L G V L K G
A M D G L I - - - - - - - - - - - - - - - - - -
GCAATGGATGGATTGATA------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V L E K F N V S E E E E V K I R R L I D K E D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D N L K I Y L T Q I L G E E K K E L I F E I L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F K G S R E V L D E L K E I L K D F P K S M E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I N N L E E I L E F V I H D K Y T I N L G I A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G L D Y Y T G M V F E I Y G K K G A K Q I C G G
- - - - - - - - V F E I Y G - - - - - Q I C G G
------------------------GTATTTGAAATCTATGGG---------------CAGATATGTGGTGGC
289290291292293294295296297298299300301302303304305306307308309310311312
G R Y D N L I E T F G G E P T P A V G F A Y G F
G R Y - - - - - - - - - - - T P A V G F A Y G F
GGGAGATAC---------------------------------ACTCCAGCTGTTGGTTTTGCCTATGGATTT
313314315316317318319320321322323324325326327328329330331332333334335336
D R I M M N I D D L D I E E E S I L I I P V K K
D R I M M N - - - - - - - - - - - - - - - - - -
GATAGGATTATGATGAAT------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D K E L I K K S L I I A D K L R K A G K I V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E I M G R K L R K A L D Y A N S R G F K K V I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V G E K E L N E G K V T V K D M I T G E Q K L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416
G I D E L T N F
- - - - - - - -
------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_his_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K V P L E P L R G F R D I L P P E S E A L R
- - - - - - - - - - - - - - - - - - - - - A L R
---------------------------------------------------------------GCCCTCAGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R L A E I F A R I A R S Y G Y G E V K P P T L E
R L A E I F A R I A R S Y G Y G E V K P P T L E
AGACTGGCCGAGATATTCGCGAGGATAGCCAGGTCCTATGGTTACGGCGAGGTGAAGCCACCTACGCTCGAG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R F Q L F A V K S G E E I R R S M Y V F R D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R E V A L R P E A T A S I A R I Y L R L L R G
- - - - A L R P E A T A S I A - - - - - - - - -
------------GCACTCCGGCCAGAGGCAACCGCCAGCATAGCC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q P K P V R L Y Y V V N C F R Y E E P Q R A R Y
- - - - V R L Y Y V V N C F R Y - - - - - - - -
------------GTGAGGCTATACTATGTAGTCAACTGCTTCCGCTAC------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R E F W Q A G V E L L G E P S I L G D F E V I K
R E F W Q A G V E L L - - - - - - - D F E V I K
CGCGAGTTCTGGCAGGCCGGGGTAGAGCTTCTC---------------------GACTTCGAGGTCATAAAG
145146147148149150151152153154155156157158159160161162163164165166167168
L L L K F Y E S I D M L D H I V L K I G N T R L
L L L K F Y E - - - - - - - - - - - - - - - - -
TTACTGCTCAAGTTCTACGAG---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y R R L F A K H G I S E E I Q D H I L H L M D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G M Y K E A L E A L M G A E H P G L A S I L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L W S N A R D D I D A A K N I L S K S G E E I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E S L E E L K K L V D M L K G Y N S R L N L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D L A F A R G L A Y Y T G T I F E V K V P G F P
- - - - - - - - - - - - - - I F E V K V - - - -
------------------------------------------ATATTCGAGGTAAAGGTG------------
289290291292293294295296297298299300301302303304305306307308309310311312
V S I A G G G R Y D N L I E L Y G G E K V P G T
- S I A G G G R Y - - - - - - - - - - - V P G T
---AGCATAGCCGGGGGAGGCCGCTAC---------------------------------GTGCCGGGCACG
313314315316317318319320321322323324325326327328329330331332333334335336
G F A I G L D R T L A A M E S S G L R P R I I Y
G F A I G L D R T L A A - - - - - - - - - - - -
GGATTCGCCATAGGGCTTGACCGCACACTAGCAGCT------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Q E P V R I A V I V L D E S L A P Y A A K V Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I L A S K D N V S A A L Y T G S K L Q K M L P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L A K Q G Y H Y A A I V G K Q E A R E G K L V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R D L A K R E Q R V L T L E E L R E L N L T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435
E F R
- - -
---------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_his_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I N A L K G M K D L L D K D A Y Y Y E K V I K
- - - - - - - - - - - - - - - - - Y Y E K V I K
---------------------------------------------------TGCTAAATTTTTATAAAACAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I C E E V A K N Y G F T F I N T P H L E L C T L
I C E E V A K N Y G F T F I N T P H L E - - - -
ACTTTCATTTTGTGCTTCATTTTCTCCCATGCAAAGAAAAATTTCAGTATTATTTTTATC------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F K R S V G E S S D I V G K E M Y E F I D K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N H V C M R P E G T A G V V R A Y I E K K L D K
- - - C M R P E G T A G V V - - - - - - - - - -
---------TTGGATATAAATTTCATCCATAGCACAAAGATA------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N T S V K R W F Y Y G S M F R Y E R P Q K G R L
- - - - K R W F Y Y G S M F R Y - - - - - - - -
------------AGTTATAATTCTTTCTATACCCATGGCAAAACCTAT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R E F H Q F G V E S L G I P N V Y E D A S I I L
R E F H Q F G V E S L - - - - - - - D A S I I L
ATACTCTATAAGTCTATCGTAGCGTCCTCCACC---------------------TATTTCATCGCTTATAAA
145146147148149150151152153154155156157158159160161162163164165166167168
M L V E I F S R L G I D F K L Q L N S L G C S Q
M L V E I F S - - - - - - - - - - - - - - - - -
TTCAAAAGCCGTTTTAGAATA---------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
C L P K Y R D R L V E F L D S K E G F C E D C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R R K N L N P I R V L D C K N E H C Q N L L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A P L L I N N L C T S C Q K D F E T L Q Q I L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D N G V K F E L D S K L V R G L D Y Y S K T A F
- - - - - - - - - - - - - - - - - - - - - - A F
------------------------------------------------------------------TACTAG
265266267268269270271272273274275276277278279280281282283284285286287288
E F I S D E I G A K A A I A G G G R Y D R L I E
E F I S - - - - - - - A I A G G G R Y - - - - -
CATTAAAATAAT---------------------AGGTATGCCAAGGCTTTCAACTCC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y L G G K S G Y G I G F A M G I E R I I T I L E
- - - - - - G Y G I G F A M G I E R I I T I - -
------------------AGGTCTTTCATAACGAAACATAGAACCATAATAAAACCATCTTTTCAC------
313314315316317318319320321322323324325326327328329330331332333334335336
Q K E E K I Q R E G I Y L C A M D E I Y I Q K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L H I A T N L R K E Y K V L L S Y E A R K L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H L E N A D K N N T E I F L C M G E N E A Q N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S L F Y K N L A K K E E K M I K I S D L K K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_his_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P S T P V S D L Q A P R G T R D F Y P E E M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R H R R L L D A W R R V S L R N G F E E V D G P
R H R R L L D A W R R V S L R N G F E E V D G P
CGGCACCGCCGGCTGCTCGACGCGTGGCGGCGCGTGTCCCTCCGCAACGGCTTCGAGGAGGTCGACGGGCCC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I F E T L D L Y K V K S G D G I V S E L F S F R
I F E - - - - - - - - - - - - - - - - - - - - -
ATCTTCGAG---------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R D G G S T D Y A L R A E F T P T L A R M V A K
- - - - - - - - A L R A E F T P T L A - - - - -
------------------------GCGCTGCGCGCCGAGTTCACGCCGACGCTGGCC---------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A N G L P K P I K W F A T P N F C R A E R P Q
- - - - - - - - I K W F A T P N F C R A - - - -
------------------------ATCAAGTGGTTCGCCACGCCGAACTTCTGCCGGGCC------------
121122123124125126127128129130131132133134135136137138139140141142143144
R G R L R E F W Q W N V D F L G E A G P S A D A
- - - - R E F W Q W N V D F L - - - - - - - D A
------------CGCGAGTTCTGGCAGTGGAACGTCGACTTCCTC---------------------GACGCC
145146147148149150151152153154155156157158159160161162163164165166167168
E V V F V L V D L L R E L G V R E G Q V Q V R I
E V V F V L V D L L R - - - - - - - - - - - - -
GAAGTCGTCTTCGTGCTCGTCGACCTGCTGCGC---------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S H R A V V A Q V L Q R L G V P A E R L T E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L L D S R S K L E P G V F A E R A A G L G L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P P K V Q R L D E V C R R R F A A G D L G H L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R A L G M D A P P D D L V G L D A Q L V A F G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A G W C A Y D L G V V R G L A Y Y T G T V F E A
- - - - - - - - - - - - - - - - - - - - V F E A
------------------------------------------------------------GTGTTCGAGGCC
289290291292293294295296297298299300301302303304305306307308309310311312
F E T A G V E R A L A G G G R Y D R L I E T F G
F E - - - - - - A L A G G G R Y - - - - - - - -
TTCGAG------------------GCGCTCGCCGGCGGAGGCCGCTAC------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G P A M P A V G F G M G D V V L A N L L R D K K
- - - M P A V G F G M G D V V L A N L - - - - -
---------ATGCCCGCCGTCGGCTTCGGCATGGGCGACGTGGTGCTCGCGAACCTG---------------
337338339340341342343344345346347348349350351352353354355356357358359360
L E P E H A G D G P D V F I V P L A D A D P A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V T G W V A R L R S G G L H A R T T Y K P T R N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T G K L L K E A T G A R A R F A L L V G V D S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431
E L K N L A T G E Q Q A I A D E D V A S R L R
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_his_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V H Q P P A G T R D L L P Q D V T Q K R W I E
- - - - - - - - - - - - - - - - - - Q K R W I E
------------------------------------------------------CAAAAGCGCTGGATCGAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S R L Q Q V F Q Q W G Y Q R I I T P T L E R L D
S R L Q Q V F Q Q W G Y Q R I I T P T L E - - -
AGCCGCTTGCAGCAGGTTTTTCAGCAGTGGGGCTATCAACGCATCATCACGCCGACATTGGAG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T L V A G G A V Q R S A V I Q V Q S D E E S G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G L R P E L T A S I A R A A V T R L A G S S L P
G L R P E L T A S I A - - - - - - - - - - - - -
GGACTGCGGCCGGAGTTGACGGCTTCGATCGCG---------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L R L Y Y L A N V F R P A F Q G D R L Q Q R E L
L R L Y Y L A N V F R P - - - - - - - - - R E L
CTGCGGCTCTACTACCTCGCCAATGTCTTTCGTCCG---------------------------CGCGAACTG
121122123124125126127128129130131132133134135136137138139140141142143144
F Q A G V E L L G V G G T L A D A E V L H V L A
F Q A G V E L L - - - - - - - D A E V L H V L A
TTTCAAGCTGGCGTGGAACTGCTG---------------------GATGCTGAAGTGTTGCACGTGCTGGCG
145146147148149150151152153154155156157158159160161162163164165166167168
D A L A E L G F G Q P P L G S W H L V V G E A S
D A L A - - - - - - - - - - - - - - - - - - - -
GATGCTTTGGCG------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L T R S L L Q P F P K D L R E K V R Q A I A Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D R V T L E S L P L E S Q L R D R A L L L H D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R G Q P D Q V F A K L Q Q L T L T P L E Q T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D R L A Q L V E L Y N A S A G P Q D S P L L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S L L R S F D Y Y T G I V F E V V Y E T P T G
- - - - - - - - - - - - - V F E V V Y - - - - -
---------------------------------------GTCTTCGAAGTCGTCTAT---------------
289290291292293294295296297298299300301302303304305306307308309310311312
P W V L A Q G G R Y D R L L D V Y D P Q A A G Q
- - V L A Q G G R Y - - - - - - - - - - - - - Q
------GTGTTGGCTCAGGGCGGCCGCTAT---------------------------------------CAG
313314315316317318319320321322323324325326327328329330331332333334335336
P G I G F S C N I E N L Q Q V L L A A N R L P H
P G I G F S C N I E N L Q Q V - - - - - - - - -
CCCGGCATCGGTTTCTCCTGCAACATTGAGAACCTGCAACAGGTA---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R P P A I D Q L V I P V D S E A Y G A A L A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q R L Q R Q D Q L R V E L Y L D S D R R P E V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q A F A Q R R R I G R I V W V S S G S A P Q S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420
A V A V A E R A T T T C
- - - - - - - - - - - -
------------------------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_his_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A A K P G I P K G T R D F S P V E M A K R N Y
- - - - - - - - - - - - - - - - - - - - K R N Y
------------------------------------------------------------CATGTTTTTCAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I F N T I R D V Y H L Y G F Q Q I E T P S M E M
I F N T I R D V Y H L Y G F Q Q I E T P S M E -
CATAGCTTTTCCTTCATTCATTTCATTCTCACCTACGATAGCAACGAAAGGAATGTTCTTAACATTTGC---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L S T L M G K Y G E E G D K L L F K I Q N S G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y F S G I T D E E L L S R N A A K L A S K F C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K G L R Y D L T V P F A R Y V V M H R D E I T F
- G L R Y D L T V P F A - - - - - - - - - - - -
---CTTCGGATACAGTTCCAACTGGTTGAGCACATC------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P F K R Y Q I Q P V W R A D R P Q K G R Y R E F
- F K R Y Q I Q P V W R A - - - - - - - - R E F
---TACTCCTGCCATACCGAATACACCAGTCAGGTTATC------------------------GCCAATCTG
145146147148149150151152153154155156157158159160161162163164165166167168
Y Q C D A D V V G S D S L L N E V E L M Q I V D
Y Q C D A D V V - - - - - - - E V E L M Q I V D
CACATCAAGCGCCTTCACCTCAAA---------------------CAATCCACGTGCCAATGTCAAGTCAAG
169170171172173174175176177178179180181182183184185186187188189190191192
T V F T R F G I R V C I K I N N R K I L T G I A
T V F T - - - - - - - - - - - - - - - - - - - -
CTCTATTTCGTT------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E I I G E A D K I V D I T V A I D K L D K I G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D N V N K E L A E K G I S G E A I A K L Q P I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L L S G T N A E K L A T L K T V L S D S E T G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K G V E E S E F I L N T L Q T M G L K N E I E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D L T L A R G L N Y Y T G A I F E V K A L D V Q
- - - - - - - - - - - - - - I F E V K A - - - -
------------------------------------------GCCTACGACATCAGCATC------------
313314315316317318319320321322323324325326327328329330331332333334335336
I G S I T G G G R Y D N L T G V F G M A G V S G
- - S I T G G G R Y - - - - - - - - - - - V S G
------GTAACGTCCTTTCTGAGGACGGTC---------------------------------GAAAGGGAA
337338339340341342343344345346347348349350351352353354355356357358359360
V G I S F G A D R I F D V L N Q L E L Y P K E A
V G I S F G A D R I F D V - - - - - - - - - - -
AGTAATTTCGTCACGGTGCATCACTACATAACGGGCGAA---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V N G T Q L L F I N F G E K E A A F S M G I L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K A R A A G I R A E I F P D A A K M K K Q M S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A N V K N I P F V A I V G E N E M N E G K A M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454
K N M E S G E Q Q L V T A E E L I G A L T K
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_his_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P F Q I P R G T Q D V L P G E T E K W Q H V E
- - - - - - - - - - - - - - - - - - K W Q H V E
------------------------------------------------------AAATGGCAGCATGTCGAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q V V R S L C G R Y G Y E E I R T P I F E H T E
Q V V R S L C G R Y G Y E E I R T P I F E - - -
CAAGTCGTCCGCAGCCTTTGCGGACGGTATGGCTATGAGGAAATCCGCACACCGATTTTTGAA---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F L R G V G D T T D I V Q K E M Y T F E D K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R A L T L R P E G T A P V A R A F V E H K L Y
- - - - T L R P E G T A P V A - - - - - - - - -
------------ACGCTCCGCCCGGAAGGAACAGCGCCGGTTGCC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G S P N Q P V K L Y Y T G P M F R Y E R P E S G
- - - - - - V K L Y Y T G P M F R Y - - - - - -
------------------GTCAAGCTCTATTACACTGGACCGATGTTCCGCTAT------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R F R Q F V Q F G V E V L G S S D P A V D A E V
- - R Q F V Q F G V E V L - - - - - - - D A E V
------CGCCAGTTTGTGCAGTTTGGCGTCGAAGTGCTT---------------------GATGCGGAAGTG
145146147148149150151152153154155156157158159160161162163164165166167168
I A L A M H I Y N E L G L Q H I R L V I N S L G
I A L A M H I Y N - - - - - - - - - - - - - - -
ATCGCACTGGCGATGCACATTTATAAC---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L D S R R A H R E A L V R H F E S R I H E L C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E D C Q A R L Q T N P L R I L D C K K D R G H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L M A T A P S I L D Y L N D E S R A Y F E K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H Y L A V L D I P F V I D S R L V R G L D Y Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H T T F E I M S D L E G F G A G A T L C G G G R
- - T F E I M S - - - - - - - - - T L C G G G R
------ACATTTGAAATTATGAGC---------------------------ACGCTGTGCGGCGGCGGTCGT
289290291292293294295296297298299300301302303304305306307308309310311312
Y N G L V Q E I G G P E T P G I G F A L S I E R
Y - - - - - - - - - - - T P G I G F A L S I E R
TAC---------------------------------ACGCCGGGCATCGGCTTTGCGCTCAGCATTGAGCGC
313314315316317318319320321322323324325326327328329330331332333334335336
L L A A L E A E G G E L P V R R G L D C Y V V A
L L A A - - - - - - - - - - - - - - - - - - - -
CTCCTGGCGGCT------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V G E Q A K T E A V R L V Y E L R R A G L R V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q D Y L G R K M K A Q L K A A D R L G A S F V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M I G D E E L E S G A A T V K D M A S G E Q M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426
V P F G E L A H V L A K R T G R E E
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_his_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I T P R A Y K G M R D H L P E A M R L R R F
- - - - - - - - - - - - - - - - - - - - L R R F
------------------------------------------------------------CGAGCGTAAATC
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I T D T L I G I L E R Y G F E P L S T P I V E Y
I T D T L I G I L E R Y G F E P L S T P I V E -
TTTGAGCTGTACTACGCCTGCAGCCAAATCATCGGGGCCAAGCACCAAGGCAAAATTCGCACCCTTGCG---
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S E T L E G K I G D E E K L L Y R L K Y G D D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L T L R Y D Q T V P L A R V V A Q N E G K L T M
- T L R Y D Q T V P L A - - - - - - - - - - - -
---GCCCGCCAAGCGCAGGCTCTCATTTTGAAAATC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P F K R Y A L G Q S Y R G E R Q A R G R Y R E F
- F K R Y A L G Q S Y R G - - - - - - - - R E F
---TGGGCGTGGCCCCATATTAAGCTCAAGCATCAAATC------------------------ACAGCCAAC
121122123124125126127128129130131132133134135136137138139140141142143144
W Q L D A D I V G V D S P I A D A E I V A V V V
W Q L D A D I V - - - - - - - D A E I V A V V V
CGTCGGCAACGAGCGTTTGCTAAA---------------------GCGGCCACCGCCCAATAACGAACCCAT
145146147148149150151152153154155156157158159160161162163164165166167168
E G L R A L G F T G A K V L L N H R E I L S G L
E G L R - - - - - - - - - - - - - - - - - - - -
CGGTGGCGAATC------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A R V A G V P E N E A G G V Y R A I D K L D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G N D G V R N E L L K S G V S A E A A E R V L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F V G I S G S I E A V L A E M E S V L A N D P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A L A A V A A L R T I C E V L T S F G V P A D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F T I A P S L A R G L S Y Y T G C V F E A V L D
- - - - - - - - - - - - - - - - - V F E A V L -
---------------------------------------------------ACCAGTAAAGCCTAAAGC---
289290291292293294295296297298299300301302303304305306307308309310311312
S P P M G S L L G G G R Y D N L V G M F S K R S
- - - - - S L L G G G R Y - - - - - - - - - - -
---------------CACCGCCACAATTTCAGCATCGGC---------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L P T V G C A F G L E R L F D L M L E L N M G P
L P T V G C A F G L E R L F D L - - - - - - - -
AAGCTGCCAAAATTCGCGGTAGCGACCACGAGCTTGGCGTTCGCCGCG------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R P E R T I D A Y V T L F A G D F Q N E S L R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A G E L R V A G L S V L T A Y S P V K I A N Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K E A D R K G A N F A L V L G P D D L A A G V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q L K D L R S G Q Q Q A V A R D A I V A A I K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434
A Q
- -
------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_his_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E Q K R K L E K L T G V K G M N D I L P Q D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A G L W E F F E A T V K S L L R A Y G Y Q N I R
- - L W E F F E A T V K S L L R A Y G Y Q N I R
------TTGTGGGAATTCTTCGAAGCGACGGTGAAGTCGCTGTTGCGCGCATACGGCTATCAGAATATCCGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T P I V E H T P L F T R G I G E V T D I V E K E
T P I V E - - - - - - - - - - - - - - - - - - -
ACGCCGATCGTCGAG---------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M Y S F V D A L N G E N L T L R P E N T A A V V
- - - - - - - - - - - - - T L R P E N T A A V V
---------------------------------------ACGCTGCGTCCCGAGAACACCGCGGCCGTCGTG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A A I E H N M L Y D G P K R L W Y I G P M F R
- - - - - - - - - - - - - K R L W Y I G P M F R
---------------------------------------AAGCGACTGTGGTACATCGGGCCGATGTTCCGT
121122123124125126127128129130131132133134135136137138139140141142143144
H E R P Q R G R Y R Q F H Q V G V E A L G F A G
H - - - - - - - - R Q F H Q V G V E A L - - - -
CAC------------------------CGCCAGTTCCATCAGGTCGGCGTCGAGGCGCTC------------
145146147148149150151152153154155156157158159160161162163164165166167168
P D A D A E I V M M C Q R L W E D L G L T G I K
- - - D A E I V M M C Q R L W E - - - - - - - -
---------GACGCGGAAATCGTCATGATGTGCCAGCGCCTGTGGGAG------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L E I N S L G L A E E R A A H R V E L I K Y L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q H A D K L D D D A Q R R L Y T N P L R V L D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K N P A L Q E I V R N A P K L I D F L G D V S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A H F E G L Q R L L K A N N V P F T I N P R L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R G L D Y Y N L T V F E W V T D K L G A Q G T V
- - - - - - - - - V F E W V T - - - - - - - T V
---------------------------GTGTTCGAGTGGGTGACC---------------------ACGGTC
289290291292293294295296297298299300301302303304305306307308309310311312
A A G G R Y D P L I E Q L G G K P T A A C G W A
A A G G R Y - - - - - - - - - - - T A A C G W A
GCCGCGGGCGGCCGCTAC---------------------------------ACCGCCGCGTGCGGCTGGGCG
313314315316317318319320321322323324325326327328329330331332333334335336
M G I E R I L E L L K E E H L V P E Q E G V D V
M G I E R I L E L - - - - - - - - - - - - - - -
ATGGGCATCGAGCGCATCCTTGAGCTT---------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y V V H Q G D A A R E Q A F I V A E R L R D T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L D V I L H C S A D G A G A S F K S Q M K R A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A S G A A F A V I F G E D E V T N G T A S V K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L R G T G D D G E K S V Q Q S V P V E S L T E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446
L I N A M V A T A E D G D D
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_his_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K Y R R I K G T N D I F G E E I W Y W R Y V E
- - - - - - - - - - - - - - - - - - Y W R Y V E
------------------------------------------------------TACTGGAGGTACGTCGAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E T F R N V C E S A G I E E I R T P I F E Q T E
E T F R N V C E S A G I E E I R T P I F E - - -
GAAACCTTCAGAAATGTGTGCGAAAGCGCGGGAATAGAGGAGATCAGAACTCCCATATTCGAA---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F V R S V G E E S D I V Q K E M Y T F Q D K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R S I T L R P E G T A P V V R A F L E N S L I
- - - - T L R P E G T A P V V - - - - - - - - -
------------ACTCTGAGACCAGAAGGTACCGCGCCCGTCGTC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D R G F Q Q R Y Y Y I G P M F R Y E K P Q S G R
- - - - - Q R Y Y Y I G P M F R Y - - - - - - -
---------------CAGAGATACTACTACATAGGTCCCATGTTCCGATAC---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R Q F H Q V G F E I I G P E S P K A D F E V I
- R Q F H Q V G F E I I - - - - - - - D F E V I
---AGACAGTTTCACCAGGTGGGTTTCGAGATCATC---------------------GATTTCGAGGTGATC
145146147148149150151152153154155156157158159160161162163164165166167168
M L V D T F L R R L G L T K Y K I H L N S I G C
M L V D T F L R - - - - - - - - - - - - - - - -
ATGCTGGTTGATACCTTCTTGAGA------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P V C R K N Y R E A L K E Y Y G R I L D N L C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D C K R R Y E T N I L R L L D C K V D H E Y S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N A P K S V D Y L C D S C R A H Y K K L K E Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N T F E I E Y V E D H T L V R G L D Y Y T R T V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTT
265266267268269270271272273274275276277278279280281282283284285286287288
F E V R H E G L G A Q S A I A G G G R Y D G L F
F E V R H - - - - - - - A I A G G G R Y - - - -
TTTGAGGTGAGGCAC---------------------GCCATCGCGGGTGGTGGAAGGTAC------------
289290291292293294295296297298299300301302303304305306307308309310311312
A E L G G S S V P A L G F A G G I E R I I L A L
- - - - - - - V P A L G F A G G I E R I I L A -
---------------------GTACCCGCCCTTGGTTTTGCAGGTGGTATAGAGAGAATTATACTCGCT---
313314315316317318319320321322323324325326327328329330331332333334335336
K A E G I E I P M K N V H L V Y I A T L G E K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F M D G V R L A G E L R K K G L S V D V D I M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R K L S G Q L K H A S R M G S R Y A V I I G D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L E K G I V I L R D L E T G D Q V E I D R D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420
A A D Y I A E R V S K D
- - - - - - - - - - - -
------------------------------------
Class II
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_his_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I Q S V R G F H D I L G K D A K K F R K I S
- - - - - - - - - - - - - - - - - - K F R K I S
------------------------------------------------------CGTCACTTCCTGGTTCTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D T A R K I L K L Y N F E E I I L P V V E Y A E
D T A R K I L K L Y N F E E I I L P V V E - - -
CACCTCGTCTTCACCGATGATAACGGCGTATTTAACGCCGAGTTTGTCGGCAAACTCCAGTTG---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F Q R S V G E T T D I V Q K E M F V F E D R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R K L A L R P E G T A G T V R A F I Q H K L Y
- - - - A L R P E G T A G T V - - - - - - - - -
------------TCCGAAGGGAATGACGAAGTAAACCTCTTCTTT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A L R P Y V K L F Y E G P M F R Y E R P Q A G R
- - - - - V K L F Y E G P M F R Y - - - - - - -
---------------AAGGGCAAACCCGAGGGCGGGAGTGGGAGGACCTCC---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y R Q F H Q I G A E V F G V A E P H A D A E I I
- R Q F H Q I G A E V F - - - - - - - D A E I I
---CCTCCCGCCTGCGATTAGCGTGAGTCCGAGCTC---------------------GGTCCTAGTGTAGTA
145146147148149150151152153154155156157158159160161162163164165166167168
K I V Y D I L Q A L G I K G V V V E I N S L G C
K I V Y D I L Q - - - - - - - - - - - - - - - -
ATCAAGCCCCCTCACGAGGTTGTA------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K K D R E A Y R E A L L N Y L T G V K E E L C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D C I S R M D R N P L R V L D C K V E T C K V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V R E A P K M I D F L C D E C R E H Y E K L K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y L K A L D I P F R E N Y N L V R G L D Y Y T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T V F E A V S D E L G L T L I A G G R Y D Y L V
- V F E A V S - - - - - T L I A G G R Y - - - -
---CGCGTGAGGTTCTGCAAC---------------ACCTATCTGGTGGAATTGCCTATA------------
289290291292293294295296297298299300301302303304305306307308309310311312
E E L G G P P T P A L G F A L G V E R L M L L L
- - - - - - - T P A L G F A L G V E R L M L L -
---------------------AGGTCCCTCGTAAAAGAGCTTCACATAAGGTCTCAGAGCGTAGAGTTT---
313314315316317318319320321322323324325326327328329330331332333334335336
P D E E E K E E V Y F V I P F G D V H E Y A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V A D I L R K K G K V V E Y S Y R K G G L K K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L E F A D K L G V K Y A V I I G E D E V K N Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403
V T I K D M E T G E Q R R V K L S E L
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_his_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S A E K A P A L I T P R T L S G F R D Y L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V M L A R E E V L R R A R E V Y R S Y G F T P I
- - - A R E E V L R R A R E V Y R S Y G F T P I
---------CTTCCACACGCCCTGCTCGAACTCCGCGGGGCCGGCGATCACCGCGAGCTTGAACCCGCGCTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D T P A C E S L D V L L G K G G D E S D K L V Y
D T P A C E - - - - - - - - - - - - - - - - - -
CTCGGCGTACCCGAGCTG------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R V L S A R G D K A E M G L R F D L T V P F A R
- - - - - - - - - - - - G L R F D L T V P F A -
------------------------------------GGCGGCGTCGAAGTTGACCACCAGCACTTGCGC---
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F S A Q Y I N E L G T P F K R Y A M G P V W R G
- - - - - - - - - - - - F K R Y A M G P V W R G
------------------------------------CTCCATCGCGGCGATGAGCCGGTCGACCCCGAGCGA
121122123124125126127128129130131132133134135136137138139140141142143144
E R P G Q G R Y R E F W Q C D F D T I G T T S N
- - - - - - - - R E F W Q C D F D T I - - - - -
------------------------CTTCGTGTACTTGCTCGCGAGGTTGTCGTACCG---------------
145146147148149150151152153154155156157158159160161162163164165166167168
A A D I E A A L V I N D L F T A L Q F D R F E I
- - D I E A A L V I N D L F T - - - - - - - - -
------GATCCCCGGGAGGTCGGTCAGGAAGGTCTCGTAAATGGT---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R I N N R M V L N G L L E S L G I A D K A A P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L R S L D K L L K I G R E K V A E E M V R E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I T P E Q A N R V L M M T D L T G P N E Q L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D L E A W F G G A N E K A T A G I R C L R E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T V A K A A G V A E G R I K I D L S I C R G L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y Y T G T I Y E T F L T D L P G I G S V C S G G
- - - - - I Y E T F L - - - - - - - S V C S G G
---------------GAACAGGTCGTTGATGAC---------------------GGCGTTGGAGGTGGTGCC
313314315316317318319320321322323324325326327328329330331332333334335336
R Y D N L A S K Y T K Q V L P G V G A S L G V D
R Y - - - - - - - - - - - L P G V G A S L G V D
GATGGT---------------------------------GCCCTGCCCCGGGCGCTCGCCGCGCCACACCGG
337338339340341342343344345346347348349350351352353354355356357358359360
R L I A A M E E L K H P L L T G A T T P A Q V L
R L I A A - - - - - - - - - - - - - - - - - - -
CCCCATCGCGTACCG---------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V V N F D A A R L G D Y Q R I A R A L R A A G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S V E V F P D A K K V G V Q L G Y A E K R G F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L A V I A G P A E F E Q G V W K V K D L A K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450
E K T I V E A E V V G A V Q S A V G
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_his_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V Y Q S P A G A R D L L P L D V A Q K H W V E
- - - - - - - - - - - - - - - - - - Q K H W V E
------------------------------------------------------GGAACCGTCATCTTTGAG
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E R L Q Q V F H R W G Y H R I I T S T L E R L D
E R L Q Q V F H R W G Y H R I I T S T L E - - -
CCAAGCAATTTGTTGGATGCGGCGCTGGCGGGCGTAGGTGCGGATTTCCTCTGGTTGGCGATC---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T L M A G G A I Q R S T V I Q V Q D R E E E L G
- - - - - - - - - - - - - - - - - - - - - - - G
---------------------------------------------------------------------TGG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L R P E L T A S I A R T A V T R M A G A T F P Q
L R P E L T A S I A - - - - - - - - - - - - - Q
CGATCGAGCGACAACGAGCCAATCACTAGC---------------------------------------TTG
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R L Y Y N A N V F C R T P D S S H N R Q L E F Y
R L Y Y N A N V F C R - - - - - - - - - L E F Y
TTGTAAATCTTCCGTGTTGAGGACAAAGCCAAC---------------------------ATACAGTCCTAA
121122123124125126127128129130131132133134135136137138139140141142143144
Q T G V E L L G S E G L L A D A E V L L L L A E
Q T G V E L L - - - - - - - D A E V L L L L A E
AAGTTGGTCGTAACGACCTCC---------------------AGCTGTTAGATTGTCGATCGCTGCATTGCC
145146147148149150151152153154155156157158159160161162163164165166167168
C L N E L G L H N W Q L I L G E A E I T Q S L L
C L N - - - - - - - - - - - - - - - - - - - - -
GATGACTTC---------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A S F P A S G R D R V R Q A I A H L D R V T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T L P L S E D L R A R A L V M L D L R G H P A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V L Q K V T K L S L D A P Q Q A A L H R L K S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V E I L D R C F S V D S N Q N S Q N F P I I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S M I R T F D Y Y T G I V F E V I G N A A I D
- - - - - - - - - - - - - V F E V I G - - - - -
---------------------------------------CAATTCATTCAAGCACTC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
N L T A Q P Q I L G Q G G R Y D Q L L G L Y H P
- - - - - - - I L G Q G G R Y - - - - - - - - -
---------------------TCCTTCGCTACCCAGCAACTCCAC---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q G K T I P G V G F V L N T E D L Q Q A L L S A
- - - - I P G V G F V L N T E D L Q Q A - - - -
------------ATCGGGCGTGCGACAAAAGACGTTAGCGTTGTAGTAGAGGCGTTGCGG------------
337338339340341342343344345346347348349350351352353354355356357358359360
D R L P Q A T P A S D W L V V A R S P A A Y A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A F A Y A E K L R C T P G L R V E M D L G D R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P E E I R T Y A R Q R R I Q Q I A W L K D D G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425
A E I E T L K R E Q G R A G S K E
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_his_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M W Y N L T I K Q L K N V R N F M I Q K P K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T S D F F L E K A D L F Q Y I L D T F R K E A E
- - - - - - - - - - L F Q Y I L D T F R K E A E
------------------------------TTATTTCAATACATATTAGATACTTTTAGAAAAGAAGCTGAA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F N Y S Y I Q T P I L E F Y D L F Y R S V G E
L F N Y S Y I Q T P I L E - - - - - - - - - - -
TTATTTAACTATAGTTACATTCAAACTCCAATTTTAGAA---------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T T D V V S K E M F I F N D R S E R K M A L R P
- - - - - - - - - - - - - - - - - - - - A L R P
------------------------------------------------------------GCTTTAAGACCA
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E K T A G V I R S L V E N K L I F N A E N K F Y
E K T A G V I - - - - - - - - - - - - - N K F Y
GAAAAAACAGCTGGAGTAATT---------------------------------------AATAAATTCTAC
121122123124125126127128129130131132133134135136137138139140141142143144
Y Y G S M F R Y E R P Q K G R Y R E F T Q I G C
Y Y G S M F R Y - - - - - - - - R E F T Q I G C
TACTATGGATCTATGTTTAGATAT------------------------AGAGAATTTACACAAATTGGTTGT
145146147148149150151152153154155156157158159160161162163164165166167168
E W I E D N S D F S D F E I L L F A S K F L G N
E W I - - - - - - - D F E I L L F A S K F L G -
GAATGAATA---------------------GATTTTGAAATTTTACTATTCGCTTCAAAATTTTTAGGC---
169170171172173174175176177178179180181182183184185186187188189190191192
F N F N K V I L K I N N L G N K V E R E N Y L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L K K Y F Y K F K D K F D E I S L K R L E K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P L R I L D D K E I N H Q D F I K N A P K L F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F L N S E T V Q K F N N L Q N Y L R K S N I S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I D Y S L V R G F D Y Y N N L V F E F V Y Y D
- - - - - - - - - - - - - - - - V F E F V Y - -
------------------------------------------------GTTTTTGAGTTTGTCTAT------
289290291292293294295296297298299300301302303304305306307308309310311312
E E S R S E L T I L G G G R Y S N L I E E L G G
- - - - - - - T I L G G G R Y - - - - - - - - -
---------------------ACAATTTTAGGTGGTGGAAGATAT---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P K K D A I G F A A G V E R L M I L L K E K E W
- - K D A I G F A A G V E R L M I L - - - - - -
------AAAGATGCAATTGGTTTTGCAGCTGGTGTGGAAAGATTAATGATTTTA------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E K P I K T S I F V F N K D H E D L Y K N F D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V Y K L R K R D L V V K Q N V S N F K L Q K I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S K I V N E G I K F L I F F D E K L N Q I I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N L I N K N F L D L T N K S Q E E K I N L V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445
F I E S E N K N E N N S K
- - - - - - - - - - - - -
---------------------------------------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_his_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G F N I P R G T Q D I L P G E S E R W Q Y V E
- - - - - - - - - - - - - - - - - - R W Q Y V E
------------------------------------------------------CTGTTGATCTCCTGTTTT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K I A R E T C H A Y Q Y K E I R T P I F E H T E
K I A R E T C H A Y Q Y K E I R T P I F E - - -
CCCATCTTTGACATTAATTTGATTTTGGTTCAGTTCATCCTCGCCCAAAACAGCGATATATTT---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L F S R G V G E S T D I V Q K E M Y T F A D K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R S L T L R P E G T A S A V R S F V E N K L F
- - - - T L R P E G T A S A V - - - - - - - - -
------------GAGAAGGGATACGGAATAGTCTTTGGCTTTGTC---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A N P V Q P T K L Y Y I G P M F R Y E R P Q T G
- - - - - - T K L Y Y I G P M F R Y - - - - - -
------------------TTTTACATTTTCAGCATCCAGTGCGGCGAGAAGGCG------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R Y R Q F Y Q F G I E A I G S N D P A I D A E V
- - R Q F Y Q F G I E A I - - - - - - - D A E V
------GCCCGGCGCTTTCGGACCGCCGAACTCCTCGGT---------------------GCCGGCAAGCGT
145146147148149150151152153154155156157158159160161162163164165166167168
I A L A M S V Y R K A G L N N L K L V I N S L G
I A L A M S V Y R - - - - - - - - - - - - - - -
CGTAATCGCTCCGAAGCCTTCGGCATT---------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D K E S R T A H R E A L I R H F E P R I D E F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S D C Q K R L R Q N P L R I L D C K K D R D H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L L K T A P S I L D Y L N E E S K A Y F A K V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q Y L T D I G I A F E V D P N L V R G L D Y Y N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H T A F E I M S N A E G F G A I T T L A G G G R
- - A F E I M S - - - - - - - - - T L A G G G R
------GTTGCTGAGACCCGCTTT---------------------------GACCTCCGCGTCAATCGCCGG
289290291292293294295296297298299300301302303304305306307308309310311312
Y D G L T E E F G G P K A P G I G F A M S I E R
Y - - - - - - - - - - - A P G I G F A M S I E R
ATC---------------------------------AAATTGGCGGTAGCGGCCCGTCTGCGGCCTTTCATA
313314315316317318319320321322323324325326327328329330331332333334335336
L L A A L D A E N V K V G A D E G I D C Y I V T
L L A A - - - - - - - - - - - - - - - - - - - -
GCGGAACATCGG------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G D K A K D Y S V S L L Y K L R E A G I S A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I D Y E Q K K M K G Q F K S A D R L N A K Y I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V L G E D E L S Q N Q I N V K D A K T G D Q Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424
I G L D E F I R F L K T N T E S
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_his_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D I K T L K G F K D Y L P K D S L I R I H I V
- - - - - - - - - - - - - - - - - - I R I H I V
------------------------------------------------------TTCAAAAGAAAGCAGCAA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R Q I F S V L N S Y N F D L I D T P V L E Y S D
R Q I F S V L N S Y N F D L I D T P V L E - - -
CTCTTCTTTTTTTGTCAAATCTCTTACTTTCATTTTATTTTCTTTGTATTCTTCTTGACCAAC---------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L L L K K S G D E T E K Q I Y R F K D N G G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V S M R F D L T V P F A R F V A T N I S A L K L
- S M R F D L T V P F A - - - - - - - - - - - -
---TTCACAAGAAATATTTTTAACCTTGGAATAATC------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P F R R S Q F G K V F R G E N S Q K G R Y R E F
- F R R S Q F G K V F R G - - - - - - - - R E F
---TTGCAAAGCACTATCTAAATTTACAATTAAAACTTT------------------------TTTAATATA
121122123124125126127128129130131132133134135136137138139140141142143144
M Q F D F D I V G E D T F R G D A E I L S V V Y
M Q F D F D I V - - - - - - - D A E I L S V V Y
ACTAAACTTTTCAAGATCAATTAT---------------------AAAAGATCCTCCAACCCCTGAAATTTT
145146147148149150151152153154155156157158159160161162163164165166167168
Y G L E E I F L N F I E G I N K K F I I H Y S H
Y G L E - - - - - - - - - - - - - - - - - - - -
TTGAATAGAGTT------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I G I L N S F F E K L G L K E K S I F I L R N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D K I D K I G I D K V K E A L L L E I E K E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D S I L S L V S L Q G T F K D K I Q A L K S I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G D N E S I K R V E D V F Q H L S L L K I Q D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F N L N L K I S R G L D Y Y T G I V F E S E V F
- - - - - - - - - - - - - - - - - V F E S E V -
---------------------------------------------------AAAAAAAGAATTCAATAT---
289290291292293294295296297298299300301302303304305306307308309310311312
G S N M G S V C S G G R Y D N L V S S F S N S I
- - - - - S V C S G G R Y - - - - - - - - - - -
---------------GATAATAAATTTTTTATTAATGCC---------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q K I S G V G G S F G V D R I K D I I D L E K F
- - I S G V G G S F G V D R I K D I - - - - - -
------TACAACAGAAAGAATCTCGGCATCGCCCCTAAAAGTGTCCTCTCCAAC------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S Y I K I F V T K A R S K V L I V N L D S A L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N Y Y Y E L A T R F R N H D Y S K V K N I S C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V Y F K N K N G K N I K E Q I E Y A L S K E I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F L V F V G Q E E Y K E N K M K V R D L T K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E L L L S F E E S I N L I K C N E K L L C T P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_his_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q E R Q T P Q L V K G T R D F N A L Q V A Q R
- - - - - - - - - - - - - - - - - - - - - - Q R
------------------------------------------------------------------CAACGA
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S Y I F D T I R Q V Y Q K Y G F S P L E T P A L
S Y I F D T I R Q V Y Q K Y G F S P L E T P A L
AGCTATATATTTGATACAATTAGGCAGGTTTACCAAAAATATGGATTTTCACCTTTAGAAACTCCTGCCTTA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E Y V S T L F G Q Y G Q E G E Q L V F R V L N S
E - - - - - - - - - - - - - - - - - - - - - - -
GAA---------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G N F L G D T P Q A L L I D Q N Y K E V L P K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E K G L R Y D L T V P L M R Y V A T H Y H E L
- - - G L R Y D L T V P L M - - - - - - - - - -
---------GGACTTCGTTATGATTTAACCGTTCCTTTAATG------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T L P F R R Y Q I Q P V W R A D R P Q K G R Y R
- - - F R R Y Q I Q P V W R A - - - - - - - - R
---------TTTAGGCGTTATCAGATACAGCCAGTATGGCGAGCG------------------------AGG
145146147148149150151152153154155156157158159160161162163164165166167168
E F Y Q C D A D V V G T P S L I V E A E I L A M
E F Y Q C D A D V V - - - - - - - E A E I L A M
GAATTTTACCAATGTGATGCAGACGTAGTG---------------------GAGGCAGAAATTCTGGCTATG
169170171172173174175176177178179180181182183184185186187188189190191192
A Y E V L Q R L G I N D F I I H L N H R S I L N
A Y E V L Q - - - - - - - - - - - - - - - - - -
GCTTATGAGGTTTTGCAA------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G I A S Q I G E L E R V N E F C T I V D K L D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V G K D K V I T E L L S K G F S E A G L E K F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F I F D L Q G D N N A K L D I L S N H L A H D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V G S K G L Q E L K E I L Q Y L E A L G M T Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I S F E P S L A R G L A Y Y T G A V F E V K L
- - - - - - - - - - - - - - - - - - V F E V K L
------------------------------------------------------GTTTTTGAAGTAAAATTA
313314315316317318319320321322323324325326327328329330331332333334335336
P T I N I G S I A G G G R Y D N L A E H F G V S
- - - - - - S I A G G G R Y - - - - - - - - - -
------------------AGTATAGCAGGAGGAGGGAGATAT------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S L T G V G F S F G V D R L Y V A M E Q L N L F
- L T G V G F S F G V D R L Y V A - - - - - - -
---CTAACAGGTGTAGGCTTTTCTTTTGGAGTAGATAGGCTATACGTAGCA---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P Q Q A Y F N T K V M V T N L D E E S V K V A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D I I T R L R N H D I P A E L Y P E K V K L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q L M Y A N K K D I P F V L I I G E E E R Q A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K F T L K D M S T G D Q A F Y T F D Q L I N I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458
S N
- -
------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_his_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A I Q R P K G T N D L L P S G S P K T E A F Q
- - - - - - - - - - - - - - - - - - K . . . . .
------------------------------------------------------GTG---------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R A A A H E W L I A Q A R E V L E R A G A Q R I
. . . . H E W L I A Q A R E V L E R A G A Q R I
------------GGCGGCTTCCTCCGACCCGATGAGGCCCACCCACACGGCGCCCCGGCGCTCGGCGTCCTT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D T P M F E E A E L V K R G V G G S T D I V R K
D T P M F E - - - - - - - - - - - - - - - - - -
GAAGGCGCTGCCCGGTTT------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E M F T V Y Y F G D H G G Y V L R P E G T A S I
- - - - - - - - - - - - - - V L R P E G T A S I
------------------------------------------GTAGAGCTGCGGCCCGCCGCTGCCCGGAAT
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V R A Y L E N G L K Q L P A P L K L W T S G P M
V - - - - - - - - - - - - - - L K L W T S G P M
CTC------------------------------------------GAACGCCCAGCCGATGCCCGGCACGCT
121122123124125126127128129130131132133134135136137138139140141142143144
F R A E R H Q K G R Y R Q F T Q V D Y E V L G S
F R A - - - - - - - - R Q F T Q V D Y E V L - -
GCCGCCGCC------------------------GCGCCCGCCGCCGCCCAGGGCCGACTTGGCGCC------
145146147148149150151152153154155156157158159160161162163164165166167168
A D A L V D A E A I A L M V A V V Q K L G L R G
- - - - - D A E A I A L M V A V V Q - - - - - -
---------------CCAGGCGGTGCGGCGGTAATAGTCCAGCCCGCGCACGAT------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V R V K L G S I G D P E D R E R Y N A Y L R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F S P H L G R L S D D S K D R L E R N P M R I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D S K S A S D Q E L L A E L S V R P M L D F L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E G A A A D F R Q V Q A Y L S D W G V P F D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P S I V R G L D Y Y R R T A W E L H Y E G I G A
- - - - - - - - - - - - - A W E L H Y - - - - -
---------------------------------------GGCGTCGACGAGCGCGTC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
K S A L G G G G R Y D G L S E Q L G G G S V P G
- - A L G G G G R Y - - - - - - - - - - - V P G
------ATCCACCTGCGTGAACTGGCGGTA---------------------------------CGGCCCCGA
313314315316317318319320321322323324325326327328329330331332333334335336
I G W A F G V E R L L L A L E Q E G I E I P G S
I G W A F G V E R L L L A - - - - - - - - - - -
GGTCCAGAGCTTGAGCGGCGCGGGCAGTTGCTTGAGCCC---------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G G P Q L Y V A A L D E E N V P L A A R V A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R A S C R A E F A Y R A M K P G S A F K D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R R G A V W V G L I G S E E A A A G T L S L K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427
L H T G E Q K T V P V G E L G Q A L A
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Eukaryotes/Capsaspora owczarzaki/amino acid sequences/Cowczarzaki_his_aa
Eukaryotes/Capsaspora owczarzaki/nucleotide sequences/Cowczarzaki_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T A F T M P A A A T T Y A T R G E L G L S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S R Q W K S S G A T P A K T A R P Q L S Q L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R G M R D V V P A V A L S Q A R V T Q T F G E V
- - - - - - - - - - - - S Q A R V T Q T F G E V
------------------------------------AGTCAAGCACGCGTCACACAGACGTTCGGGGAGGTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T A N L G F G E V E T P I V E Q E S L F K R S I
T A N L G F G E V E T P I V E - - - - - - - - -
ACTGCCAACCTGGGCTTTGGCGAGGTCGAAACGCCGATCGTCGAG---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G A D S S V V M K E M Y A F D D P D G G R L C L
- - - - - - - - - - - - - - - - - - - - - - C L
------------------------------------------------------------------TGCTTG
121122123124125126127128129130131132133134135136137138139140141142143144
R P E G T A G V M R A V L Q R L A A E P T P S I
R P E G T A G V M - - - - - - - - - - - - - - -
CGCCCGGAAGGCACCGCTGGAGTGATG---------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N A D V H A S L C Y T G P M F R R E K P Q A G R
- - - - - A S L C Y T G P M F R R - - - - - - -
---------------GCGAGTCTTTGCTACACGGGACCCATGTTCCGTCGA---------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y R Q F L Q C G V E Y L G S A G V D A D G L V L
- R Q F L Q C G V E Y L - - - - - - - D G L V L
---CGTCAGTTTCTGCAGTGCGGCGTCGAGTACCTG---------------------GATGGCCTCGTCCTG
193194195196197198199200201202203204205206207208209210211212213214215216
Y A A W R L I R E L G L S S Q V V L Q L N T L G
Y A A W R L I R - - - - - - - - - - - - - - - -
TACGCTGCCTGGCGTCTCATCCGT------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T S A E R Y R Y V Q A L R D Y L E P R A N E L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G E S L S R L R G R T P V V A T G S D E L R Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A A G A S T T S A A E D T G I V G R V L R I L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S K H A Q D H A V L E A A P L L S D F L D P S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H A R F A E L K E T L E A L A I P F T V N P R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V R G L D Y Y S H T V F E I V A N S G V L G A Q
- - - - - - - - - - V F E I V A - - - - - - - -
------------------------------GTTTTTGAAATTGTTGCA------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S T V L A G G R Y D E L S L V L G G K R K V P A
- T V L A G G R Y - - - - - - - - - - - - V P A
---ACAGTACTAGCTGGTGGGAGGTAC------------------------------------GTGCCGGCT
385386387388389390391392393394395396397398399400401402403404405406407408
V G W A A G V E R L S L A R A S T P Q G P S S K
V G W A A G V E R L S L A - - - - - - - - - - -
GTCGGATGGGCTGCCGGTGTCGAGCGGCTTTCACTCGCC---------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T G Q A E C G L A A P P A E Q P L G P F A V P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S V F L S S R P N A I Q A G R L A R V G I L I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P P K P V Y P D Q Q Q S A P A A V S P Q L S P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q L V S L L Y Q T V E E L N Q K G I C T I P I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V R S R E C T D K P A T S S R S V P M L G D Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R A A A R H G L E H V V L L Y P D Q A A T G T A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V V R H L A S A H Q Q S V S L T S L A T H V L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579
L S S
- - -
---------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_his_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S S T A S P N A A L L A E I N D L K V K L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K E A L L Q P E G V V S K K S K K K S Q A N M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K E P V Q G C R D F P P E D M R V R R H L F G
- - - - - - - - - - - - - - - - - V R R H L F G
---------------------------------------------------GCCCTTGTCACGCAGCTGCTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V F H D T A R R F G F E E Y D A P V L E S E E L
V F H D T A R R F G F E E Y D A P V L E - - - -
CAATACCTTCAGGGCGGTGCCTCGCTGAGACTCATTGAACGGAATCACCACATCATCCAC------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y I R K A G E E I T E Q M F N F V T K G G H R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T L R P E M T P S L V R L Q L A K G R S L L L P
T L R P E M T P S L V - - - - - - - - - - - - -
GACAGGCTGCGGGCTGCCGTACAGAGTGAAGAG---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A K W Y S I P Q C W R Y E A I S R G R R R E H Y
A K W Y S I P Q C W R Y - - - - - - - - R E H Y
ACCACTGCGGTCAAACGCTTCGAAAACGATGCCGGT------------------------ACTCGCATCGAA
169170171172173174175176177178179180181182183184185186187188189190191192
Q W N M D I V G V K S V A A E V E L V C A A C A
Q W N M D I V - - - - - - - E V E L V C A A C A
CTGGATCCAGTCGCCGTACCC---------------------GAACTCTGCGAGCTCCGAGAGGGCGCCGTT
193194195196197198199200201202203204205206207208209210211212213214215216
A M E S L G L T A Q D V G V K V N S R K L L Q C
A M E - - - - - - - - - - - - - - - - - - - - -
CTTGTCAAA---------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A L A G A G V P D S L F A P V C V I V D K M E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L P E E Q I R A E L K D L A L D G Q Q A D D I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K T L S L R S V D D F D K D L F D K N G A L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L A E F F S Q M Q M Y G Y G D W I Q F D A S V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R G L A Y Y T G I V F E A F D R S G E F R A I C
- - - - - - - - - V F E A F D - - - - - - A I C
---------------------------GCACTGCGGAATGGAGTA------------------CAGAGAGCG
337338339340341342343344345346347348349350351352353354355356357358359360
G G G R Y D N L F T L Y G S P Q P V S C V G F G
G G G R Y - - - - - - - - - - - - V S C V G F G
GCCCTTGGCGAGCTG------------------------------------TGTGACACGGTGGCCACCCTT
361362363364365366367368369370371372373374375376377378379380381382383384
F G D C V I V E L L K K K K L I N S L P H K V D
F G D C V I V E L - - - - - - - - - - - - - - -
CGTCACAAAGTTGAACATTTGTTCTGT---------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D V V I P F N E S Q R G T A L K V L K Q L R D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G R S A D I I M D S K K V A Q T F S Y A D R I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A D R A V L I A P D E T E K G M A R V K M L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473
G Q R G E D D R G D P V P F E D L
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_his_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V Q N G K E S F F I G S G G I S L E D V A L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S T S D K S E F V L E P K L R E S E E L E Q L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D G D F W T G D N E M G M V Q E G K E L S L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V R A L M L T K A V G I A I D G K G I S K K L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M W L L E Q L R N K G S T L V K V K Y L S T D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L T L T N L L G E Y L R I S G H K V S K R D A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A F T K G F S M T V S Q L A L Y L G I S S S L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S F G E C T L A I L V E A M S F P L C F L A H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S S I S S G G L A E T T R N V R W L L E D S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q R E N R W K N K S L G V K L S E I L C S L G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L Q N S I E N L S K C I K G F Y A K S G N V T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S T K G I E N S I D Y I E I M P I L E P L K N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I S S L N Y M K K S S I E F L D L F L R D T I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E E I V S E N D F S K F A L D S E I S V Q G L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I E Q I S K S V T P L T I E D L S H I N S R I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E M I N G Q F D S S I I L R I S T M E E S K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D A L K V L T N E N I E I F T I I C I L S L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K L A D K N Y Q Q Y L S T I E K A K K K G K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V S I A S H E S K N I H E F R Q F M I N L I L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S S I F E S S K N G V E S N I Y S K I L E I F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D G Q I C K L D S T L K Y I T T P Q N Q S L R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P K I P K G T Q D V T P Q K M A I K N L V F G M
- - - - - - - - - - - - - - - - I K N L V F G M
------------------------------------------------TGATGAATTTAATATCAAGTTAAT
529530531532533534535536537538539540541542543544545546547548549550551552
I R E V Y R A H G A V E I D T P V F E L K D T L
I R E V Y R A H G A V E I D T P V F E - - - - -
CATAAATTGTCTAAATTCATGGATATTCTTTGATTCATGAGAAGCTATCGAAACTTC---------------
553554555556557558559560561562563564565566567568569570571572573574575576
L G K Y G E D S K L I Y D L K D Q G G E Q L S L
- - - - - - - - - - - - - - - - - - - - - - S L
------------------------------------------------------------------AATACA
577578579580581582583584585586587588589590591592593594595596597598599600
R Y D L T V P L A R Y I A T S G L D H L K R Y Q
R Y D L T V P L A - - - - - - - - - - L K R Y Q
AATAATTGTAAAGATTTCAATATTCTC------------------------------TTCCTTAGACTCCTC
601602603604605606607608609610611612613614615616617618619620621622623624
I G K V Y R R D E P Q M A R G R F R E F Y Q C D
I G K V Y R R - - - - - - - - - - R E F Y Q C D
CATTGTAGATATTCTTAATAT------------------------------TTCACTAATTCTAGAGTTAAT
625626627628629630631632633634635636637638639640641642643644645646647648
L D I V G H Y D S M V A D S E I I K I A T Q V L
L D I V - - - - - - - - D S E I I K I A T Q V L
ATGAGACAAATC------------------------CTTTGATATCTGCTCTATATTTAAACCTTGTACTGA
649650651652653654655656657658659660661662663664665666667668669670671672
S S F S N W I G Q F M I K I N H R Q L L D G I L
S - - - - - - - - - - - - - - - - - - - - - - -
TAT---------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E I S G V P N E K F K T T C S S I D K L D K E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
W E S V R N E M I N I K G L S E S T V D K I G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
I I Q L K G T P F D V L E K I K S N Q E M M E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
K N I M K A L E E L E T L F K Y T K S C N N C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
N Y L S F D L S L A R G L D Y Y T G V I Y E A V
- - - - - - - - - - - - - - - - - - - I Y E A V
---------------------------------------------------------GTGAGCTAAAAAGCA
793794795796797798799800801802803804805806807808809810811812813814815816
L I S N E L N V G S I A A G G R Y D Q L I G M F
L - - - - - - - - S I A A G G R Y - - - - - - -
TAA------------------------TATTGCCAAAGTACATTCTCCAAA---------------------
817818819820821822823824825826827828829830831832833834835836837838839840
S Q K N I P A V G F S V G V E R I M S I I E K K
- - - - I P A V G F S V G V E R I M S I - - - -
------------AGCAAGTTGAGAAACTGTCATACTGAAACCTTTTGTAAAGGCTCTTGC------------
841842843844845846847848849850851852853854855856857858859860861862863864
F E A C K T H N H S S K G S F T D V L I C N V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
D S F L E Y R F K I A S L L W D N H I S C E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
L T G N G K L R K Q L D Y A S N N N I P Y C I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
I G E S E A L K E T V Q F K F I H N N Q S E T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
T E Q T T S V S S Q E V H I N D L V P H I Q S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961962963964965966967968969970971972973974975976977
I L Q F G S T Y S K F S S E F K M
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_his_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P V V E L G G T S L T L E S F Y N V C Y C R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A P I V L D A S V F A A F L P A P E N P V P R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y H Y A T L F S G K Y R S V P Y V L S R A Y I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F T M L S L L A S S P A S V S I T V L Q G L T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I L N G P K D I A L Q R P E C V L L P N S A L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K D L L D Q L L S I L T E G P D N P F Y I E L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D E D I N I F K L N A H A F T L S V S F A S S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L S F V A T L H E A A L S F S F E L M C A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R E L F D F V N Y T V Q R K H S G M K A A M S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V M S L I S G S K K V T Q K G S N L F C S Q S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S L A G E I R E L A T E L R T A V R P D T A S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A Y T S L D T R P L T D V T T L S L L H G V Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K I A T I R S L S I A R R H L V D A V V V E K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I W K A P S D D A Y G V A E S E M L D A L K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P V P V L H A L L L P V Q L C G V L K D L S T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L L S A F T K L S I A Q A G L S K G K I Q V G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G V L I A M D T Y G D L F R E C Q S A S G A H Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F W C I S R I V R A M T D H L F L A I S N A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P Q P P C G M R D L L P G Q M V L R Q A A L S L
- - - - - - - - - - - - - - - - L R Q A A L S L
------------------------------------------------CTTAGGCAAGCTGCTCTTTCACTG
457458459460461462463464465466467468469470471472473474475476477478479480
I T S V F Q Q H G A V C I E T P V M E S R S V L
I T S V F Q Q H G A V C I E T P V M E - - - - -
ATAACGAGCGTATTTCAACAACATGGCGCCGTCTGCATAGAGACCCCAGTCATGGAA---------------
481482483484485486487488489490491492493494495496497498499500501502503504
M G K Y G E E Q K L I Y N V S D Y G E E P L S L
- - - - - - - - - - - - - - - - - - - - - - S L
------------------------------------------------------------------TCTCTT
505506507508509510511512513514515516517518519520521522523524525526527528
R Y D L T V P F A R Y C A T H R E K S I K R Y S
R Y D L T V P F A - - - - - - - - - - I K R Y S
CGGTATGATTTAACGGTCCCGTTTGCG------------------------------ATTAAGCGCTATTCC
529530531532533534535536537538539540541542543544545546547548549550551552
I G R V Y R R D K P V M E K G R F R E F Y Q C D
I G R V Y R R - - - - - - - - - - R E F Y Q C D
ATCGGGCGCGTTTACAGACGA------------------------------CGTGAGTTTTATCAATGCGAT
553554555556557558559560561562563564565566567568569570571572573574575576
L D I V Y E P N T Q A P M A A D A E V V V I V F
L D I V - - - - - - - - - - - D A E V V V I V F
CTGGATATTGTC---------------------------------GACGCTGAGGTCGTAGTTATTGTATTT
577578579580581582583584585586587588589590591592593594595596597598599600
E I L H A L R K S I R N F E I L I N H R G I L D
E I L H - - - - - - - - - - - - - - - - - - - -
GAGATTCTGCAT------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
S A M A V A G V S D E Q K K A V C S C I D Q L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
K H S K E E V R D K I V K S K G L T P V V A D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
V L A L I D F K L P T S P H M F A N S P F D F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S T A I A A L K E L H A S I S L D S T L S S Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
I D A I S P R L E Q L G L L F R Y A S L M C P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
S L E Y M V L D F S L A R G L D Y Y T G M V F E
- - - - - - - - - - - - - - - - - - - - - V F E
---------------------------------------------------------------GTTTTCGAA
745746747748749750751752753754755756757758759760761762763764765766767768
A K L I S D H G E R T G S I A G G G R Y D E L L
A K L - - - - - - - - - S I A G G G R Y - - - -
GCAAAGCTG---------------------------TCGATAGCAGGAGGGGGACGTTAT------------
769770771772773774775776777778779780781782783784785786787788789790791792
G K F R A R G D E L C A V G G S I G I E R I F A
- - - - - - - - - L C A V G G S I G I E R I F A
---------------------------CTTTGCGCAGTCGGGGGAAGCATAGGGATAGAACGCATATTTGCC
793794795796797798799800801802803804805806807808809810811812813814815816
I L E A R Q A S L D G L A T G D V E D G G S S C
I - - - - - - - - - - - - - - - - - - - - - - -
ATT---------------------------------------------------------------------
817818819820821822823824825826827828829830831832833834835836837838839840
K L A S A K R Y D V Y I C G A P G C T I E A R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
841842843844845846847848849850851852853854855856857858859860861862863864
E V A G I L W G L G I S V G M S C K E G C S Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
865866867868869870871872873874875876877878879880881882883884885886887888
L L K K D I D E G V A G H A L L A L I I G G D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
889890891892893894895896897898899900901902903904905906907908909910911912
I E N R V I N V K N L S T T E Q V V V P F D E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
913914915916917918919920921922923924925926927928929930931932933934935936
G E Y C A K A L A T R H E R F A L S E C E K L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
937938939940941942943944945946947948949950951952953954955956957958959960
R D V K D G K E V R E G I D N I L A A I K M L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
961
T
-
---
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_his_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_his_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K L Q N L R G M V D L L P E H T P L W Q F I
- - - - - - - - - - - - - - - - - - - L W Q F I
---------------------------------------------------------TTATGGCAGTTTATT
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E E T A R T H F R R S G V N E I R T P L L E P T
E E T A R T H F R R S G V N E I R T P L L E - -
GAAGAAACTGCCCGTACCCACTTTAGGCGTTCTGGAGTAAACGAAATACGTACACCTTTACTTGAA------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L F A R G I G E S T D V V N K E M Y S F F D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G D R S C T L R P E G T A S I V R A A L Q H N L
- - - - - T L R P E G T A S I V - - - - - - - -
---------------ACTTTACGTCCAGAAGGCACTGCTTCGATAGTA------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L A Q G P Q R F W Y S G P M F R Y E R P Q A G R
- - - - - Q R F W Y S G P M F R Y - - - - - - -
---------------CAACGATTTTGGTATAGTGGACCCATGTTCCGTTAT---------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q R Q F H Q I G L E L H G Y S D P R S D V E A I
- R Q F H Q I G L E L H - - - - - - - D V E A I
---AGGCAGTTTCACCAAATTGGTTTAGAATTGCAT---------------------GATGTTGAAGCTATT
145146147148149150151152153154155156157158159160161162163164165166167168
S I A W D L L M D L G V K R L A L E L N T L G S
S I A W D L L M - - - - - - - - - - - - - - - -
TCTATTGCATGGGATTTGTTAATG------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I S D R I L Y R Q K L E T W L S D H F N E L D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D S R A R V S S N P L R I L D S K I P S T K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L K K A P L L S N E L S A E S S E R F A A V R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G L A N L G I P F K I N P Y L V R G L D Y Y S H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T A F E I I S D Q L G A Q S T V C G G G R Y D G
- A F E I I S - - - - - - - T V C G G G R Y - -
---GCTTTTGAAATCATTAGT---------------------ACTGTTTGCGGGGGAGGCCGTTAT------
289290291292293294295296297298299300301302303304305306307308309310311312
L V E Q L G G H N T P A I G W A L G V E R L V L
- - - - - - - - - T P A I G W A L G V E R L . L
---------------------------ACACCAGCAATTGGCTGGGCTTTGGGAGTTGAGCGTCTT---CTG
313314315316317318319320321322323324325326327328329330331332333334335336
L I M Q G N I P I K I P S P D F Y I I N K G K V
L I - - - - - - - - - - - - - - - - - - - - - -
CTAATC------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A E A I A L T L A R Q L R N S G M I V E L D C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K S A F S K Q F K R A D R S N A L Q A I I L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E E V A R N Q I R I K N L R T N I S N R S L N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422
E D F L D N S K F S I L Y C
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_lys_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L V M E L N D L Q A Q R A A K L E Q L R A A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D P Y P P R C R R S H T I G Q V L A A F D E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A A G E A V V T L A G R I I G A R R V M G K I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F A H I E D G T G E I Q L W L S R A D L G D E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F E R F R D Q I D T F D I V Q A T G T L R R T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T G E R S L F V R E M A V L A K A I N P P P E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W A G L Q D V E E R H R Q R Y L D L I V N R E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R D I F R A R A Q V M S T M R R V L D D R G F L
- - - - - A R A Q V M S T M R R V L D D R G F L
---------------GCCCGTGCGCAGGTGATGAGCACGATGCGGCGCGTGCTTGACGATCGCGGCTTTCTT
193194195196197198199200201202203204205206207208209210211212213214215216
E V E T P V L Q P I Y G G A A A R P F V T Y H N
E V E T P V L Q - - - - - - - - - - - - - - - -
GAGGTCGAGACACCGGTTTTGCAA------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A L G Q N L Y L R I A T E L Y L K R L I V G G F
- - - - - - Y L R I A T E L Y L K - - - - - - -
------------------TATCTCCGGATCGCCACAGAACTCTACCTCAAG---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P G V Y E I G K N F R N E G V D R S H N P E F T
P G V Y E I G K N F R N - - - - - - - - P E F T
CCCGGCGTGTATGAGATCGGTAAAAACTTTCGCAAC------------------------CCTGAGTTTACG
265266267268269270271272273274275276277278279280281282283284285286287288
M M E C Y Q A Y A D Y H A M M T L V E E M L G E
M M E C Y Q A - - - Y H A M M T L V E E M L G -
ATGATGGAGTGTTATCAGGCG---------TATCACGCCATGATGACCCTCGTCGAAGAGATGTTGGGT---
289290291292293294295296297298299300301302303304305306307308309310311312
I C L A V H G T T T I S Y Q G R E L D L R P P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P R I A M A D A I V E R T G I D I T R H T D L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S L H A A I A D R G L R V D R K T S W A K Q V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E L F S E F V Q P H L F Q P T F I I D Y P V A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S P L A K R I P G R P D F T E R F E A F I A G M
- - - - - - - - - - - - - - - R F E A F I - - -
---------------------------------------------CGCTTTGAGGCGTTTATC---------
409410411412413414415416417418419420421422423424425426427428429430431432
E I G N A F T E L N D P F D Q E E R F R E Q L R
E I G N A F T E - - - - - - - - - - - - - - - -
GAGATCGGGAATGCGTTTACCGAG------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A F A A G D E E A H Q M D E D F I N A L R Y G M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P P T G G L G I G I D R L V M V L T D Q A S I R
P P T G G L G I G I D R L V M V - - - - - - - -
CCGCCAACCGGTGGTCTTGGTATCGGGATCGATCGGTTGGTGATGGTT------------------------
481482483484485486487488489490491492493494495496
E V I L F P H L R E R L E G R G
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_lys_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F D N I L E Q Q R I E K A K E L K N L G I N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y P H F L E K E M S L K T F K D K F S Y I L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V E K R D E S V N A V V A G R L K L L R I A G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S I F A N I E D E D T N L Q I Y F S K D S V G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L Y T I L K K N L E V G D I V L V K G F P F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T K T G E F S L H A S E V K L A T K A I V P L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K Y H G L T D I E Q R Y R K R Y V D M I M N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E V R K D F L V R S K V V S L I R H F F E N K G
- - - - - - - V R S K V V S L I R H F F E N K G
---------------------GTGCGTTCTAAAGTGGTGAGTTTAATCCGTCATTTTTTTGAAAATAAAGGC
193194195196197198199200201202203204205206207208209210211212213214215216
F L E V E T P M M H P I A G G A N A K P F V T F
F L E V E T P M M H - - - - - - - - - - - - - -
TTTTTAGAAGTAGAAACTCCTATGATGCAT------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H N S L G V E R F L R I A P E L Y L K R L I V G
- - - - - - - - F L R I A P E L Y L K - - - - -
------------------------TTTTTAAGAATTGCTCCAGAACTTTATCTTAAA---------------
241242243244245246247248249250251252253254255256257258259260261262263264
G F E A V F E I N R C F R N E G M D L T H N P E
- - E A V F E I N R C F R N - - - - - - - - P E
------GAGGCGGTTTTTGAAATCAATCGTTGTTTTAGAAAC------------------------CCCGAA
265266267268269270271272273274275276277278279280281282283284285286287288
F T T I E F Y W A Y H N Y K D L M D L T E E L F
F T T I E F Y W A - - - Y K D L M D L T E E L F
TTTACAACTATAGAATTTTATTGGGCC---------TATAAAGATTTAATGGATTTAACCGAAGAACTTTTT
289290291292293294295296297298299300301302303304305306307308309310311312
A L L L D K L N L G K T I E F D G K M I N F S K
A - - - - - - - - - - - - - - - - - - - - - - -
GCT---------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P F E R I T Y K D A L C K Y G G L D R D L I E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K E K I L T K L K A D G F E A N E K L E L G H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
Q A E L F D N Y V E E K L I N P T F V I D F P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S I S P L S R R S D E D S Q I A E R F E L F I C
- - - - - - - - - - - - - - - - - R F E L F I -
---------------------------------------------------AGATTTGAGTTGTTTATT---
409410411412413414415416417418419420421422423424425426427428429430431432
G R E L A N G F N E L N D P L D Q Y E R F L K Q
- - E L A N G F N E L N D P L D Q Y E R F L K Q
------GAATTGGCAAATGGTTTTAATGAGCTTAATGATCCTCTTGATCAATATGAGAGATTTTTAAAACAA
433434435436437438439440441442443444445446447448449450451452453454455456
I E A K N A G D E E A C E M D E D F V N A L G Y
I E - - - - - - - - - - - - - - - - - - - - - -
ATTGAA------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G M P P T A G Q G I G I D R L V M L L T N K K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501
I R D V I L F P A M R P L K S E L K E K E
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_lys_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T E P I Q P Q A A V A A D E N Q I V A E R R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K L R A L R D Q G I A Y P N D F Q P T H H A A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L Q T A Y A D A D K E A L E A K S L E V A I A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R M M L K R V M G K A S F A T V Q D G S G Q I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F F V T P A D V G A E T Y D A F K K W D L G D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V A A R G V L F R T N K G E L S V K C T Q L R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L A K A L R P L P D K F H G L A D Q E T R Y R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R Y V D L I V T P E T R T T F R A R T K A I A S
- - - - - - - - - - - - - - - - A R T K A I A S
------------------------------------------------GCGATGAAACGGTTGCGCGAGATC
193194195196197198199200201202203204205206207208209210211212213214215216
I R K F M G D A D F M E V E T P M L H P I P G G
I R K F M G D A D F M E V E T P M L H - - - - -
GAGCTCGCGGCCCTGGTACTGGATCGTCGCGGTGCCGAGCGCGTCCACGGCCGCCTG---------------
217218219220221222223224225226227228229230231232233234235236237238239240
A A A K P F V T H H N A L D M E M F L R I A P E
- - - - - - - - - - - - - - - - - F L R I A P E
---------------------------------------------------CATCGTGAATTCCGGATTGTG
241242243244245246247248249250251252253254255256257258259260261262263264
L Y L K R L I V G G F E R V F E I N R N F R N E
L Y L K - - - - - - - E R V F E I N R N F R N -
GCGCGGCGACAC---------------------GTTGATCTCGAACACGCGCTCGAAGCCGCCGACGAT---
265266267268269270271272273274275276277278279280281282283284285286287288
G V S P R H N P E F T M M E F Y A A Y T D Y R W
- - - - - - - P E F T M M E F Y A A - - - Y R W
---------------------CGCGATGCGCAGGAACATTTCCATGTCGAGCGC---------CGTGACGAA
289290291292293294295296297298299300301302303304305306307308309310311312
L M D F T E R L I R Q A A V D A L G T A T I Q Y
L M D F T E R L I R - - - - - - - - - - - - - -
CGGCTTCGCGGCCGCGCCGCCCGGGATCGG------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q G R E L D L A Q P F H R L T I T Q A I Q K Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P S Y T D G Q L S D D A F L R S E L K R L G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V T Q P A F L N A G I G A L Q L A L F E E T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A Q L W E P T F I I D Y P I E V S P L A R E S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T V A G I T E R F E L F I T G R E I A N G F S E
- - - - - - - R F E L F I - - - E I A N G F S E
---------------------CTGACCCGAGCCGTCCTG---------GAAGCTCGCCTTGCCCATCACGCG
433434435436437438439440441442443444445446447448449450451452453454455456
L N D P E D Q A A R F K K Q V E Q K D A G D E E
L N D P E D Q A A R F K K Q V E - - - - - - - -
CTTGAGCATCATCCGGCCGGCGATCGCGACCTCGAGCGACTTCGCCTC------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A M F F D A D Y I R A L E Y G M P P T G G C G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G I D R L V M L L T D S P T I R D V L L F P H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508
R R E D
- - - -
------------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_lys_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D L R A T R L E K A L Q L R E L G F E P Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y R W D C S H S A A Q L Q A L Y A D L P A G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V A V E V A I A G R I M A R R V F G K L A F F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L Q D E S G Q I Q L Y L E K Q R L S E S M A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D A E A F S H L K A L T D V G D I L G V K G S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R R T E K G E L S I A V D Q Y A I L T K S L Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P D K W H G L T D V E K R Y R Q R Y V D L I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N P E V R E T F R R R A K I T A A I R R H L E D
- - - - - - - - - R R A K I T A A I R R H L E D
---------------------------CGCTGCCAACACCAGTTCCGCCATCGTTGCCCGTTTCCACGGTGG
193194195196197198199200201202203204205206207208209210211212213214215216
Q G F I E I E T P V L Q A E A G G A E A R P F I
Q G F I E I E T P V L Q - - - - - - - - - - - -
CGCCAGATCGATCGTCTGACCTTGGTAGGGCACTTG------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T Y H N T L E L D L Y L R I A T E L H L K R L I
- - - - - - - - - - Y L R I A T E L H L K - - -
------------------------------GTAGTCGGCATAGGCCTGATAGACCTCGATCGA---------
241242243244245246247248249250251252253254255256257258259260261262263264
V G G F E K V F E L G R I F R N E G I S T R H N
- - - - E K V F E L G R I F R N - - - - - - - -
------------GGTTGAAATGCCCTCGTTGCGGAAAATGCGCCCTAG------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P E F T S I E V Y Q A Y A D Y E D M M R L T E T
P E F T S I E V Y Q A - - - Y E D M M R L T E T
GACAATTAGGCGCTTGAGGTGCAACTCGGTTGC---------ATAAAGGTCGAGTTCTAAGGTGTTGTGGTA
289290291292293294295296297298299300301302303304305306307308309310311312
L I A Q V A E Q V V G S L Q V P Y Q G Q T I D L
L I A - - - - - - - - - - - - - - - - - - - - -
AGTGATGAA---------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A P P W K R A T M A E L V L A A T G I D F E S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K D L E A G I A A V K A A G I P V P E D C P N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G K L L N H C F E E K V E A T L I Q P T F V I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y P V E I S P L A K P H R S K P G L V E R F E L
- - - - - - - - - - - - - - - - - - - - R F E L
------------------------------------------------------------GAAAGCTTCGGC
409410411412413414415416417418419420421422423424425426427428429430431432
F I V G R E T A N S F S E L T D P V D Q R Q R L
F I - - - E T A N S F S E - - - - - - - - - - -
ATCGAT---------CGATTCACTGAGCCGCTGCTTCTC---------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E A Q A A D K A A G N V E A N D V D E D F L L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L E H G M P P T G G L G I G I D R L V M L L T D
- - - - - P P T G G L G I G I D R L V M L - - -
---------------TGGCAAGTCAGCATAGAGCGCTTGGAGCTGCGCGGCACTATGGCTACA---------
481482483484485486487488489490491492493494495496497498499500501502503504
S P S I R D V I A F P L L R P E A S S E E A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_lys_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N I L E L S E Q E I I R R N S L N E L R A M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I E P Y P A A E Y V T N A F S T D I K A E F K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D E T P R Q V S V A G R M M S R R I M G K A S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I E L Q D S K G R I Q V Y I T R D D I C P G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K E M Y N T V F K R L L D L G D F I G I E G F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F R T Q M G E I S I H A Q K L T V L A K S I K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P I V K Y K D G V T Y D S F E D P E L R Y R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R Y V D L A V N E G V K D I F I K R S K V Y S S
- - - - - - - - - - - - - - - - K R S K V Y S S
------------------------------------------------AAACGCAGCAAAGTATACAGTTCC
193194195196197198199200201202203204205206207208209210211212213214215216
M R E Y F N S K G Y M E V E T P I L Q A I A G G
M R E Y F N S K G Y M E V E T P I L Q - - - - -
ATGCGCGAATACTTCAACTCAAAGGGATACATGGAAGTGGAAACTCCGATCCTGCAG---------------
217218219220221222223224225226227228229230231232233234235236237238239240
A A A R P F M T H H N A L D I P L Y M R I A S E
- - - - - - - - - - - - - - - - - Y M R I A S E
---------------------------------------------------TACATGCGAATCGCCAGTGAG
241242243244245246247248249250251252253254255256257258259260261262263264
L Y L K R L I V G G F E G V Y E I G K N F R N E
L Y L K - - - - - - - E G V Y E I G K N F R N -
CTTTACCTGAAA---------------------GAAGGTGTATACGAGATCGGTAAAAACTTCCGTAAC---
265266267268269270271272273274275276277278279280281282283284285286287288
G M D R T H N P E F T C M E I Y V A Y K D Y N W
- - - - - - - P E F T C M E I Y V A - - - Y N W
---------------------CCAGAATTCACCTGTATGGAGATATATGTAGCC---------TACAATTGG
289290291292293294295296297298299300301302303304305306307308309310311312
M M E F T E K M I E K I C L D V N G T T E V K V
M M E F T E K M I E - - - - - - - - - - - - - -
ATGATGGAATTTACTGAAAAAATGATCGAA------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G D N I I N F K A P Y K R V T M L G A I K E H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G Y D L T G M N E E Q I R E V C K K L N M E I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D T M G K G K L I D E I F G E F C E G T Y I Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T F I T D Y P I E M S P L T K K H R D N P E L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E R F E L M V N G K E L C N A Y S E L N D P I D
- R F E L M V - - - E L C N A Y S E - - - - - -
---CGTTTCGAGTTGATGGTA---------GAGTTGTGTAACGCATATTCTGAG------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q L E R F E D Q M K L S E K G D D E A M I I D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D F V R A L E Y G M P P T S G M G I G M D R L T
- - - - - - - - - - P P T S G M G I G M D R L T
------------------------------CCTCCTACTTCGGGTATGGGTATTGGTATGGACCGTCTGACT
481482483484485486487488489490491492493494495496497498499500501502503504
M L M T G Q S T I Q E V L F F P Q M R P E K V V
M L - - - - - - - - - - - - - - - - - - - - - -
ATGCTG------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P K D S A S K F M E L G I A E E W V P V I Q K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G Y N Q V A D M K E V N P Q K F H Q D I C G I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575
K K Y K L E L T N P S V N D V A E W I Q K I K
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_lys_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N D Q T R Q R L L N L E A L V E A G F A P Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y R F P K T H S A E A I L K A K R G A P P E S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W P E E E V A V A G R L V A L R R M G K V T F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H L L D E T G R I Q L Y F Q R D L T P K Y E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K L D V G D I L G V R G H P F T T K T G E V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V K V L D W T P L V K S L H P L P D K W H G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D K E V R Y R Q R Y L D L I V N P E V R E V F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R R S E I V R Y I R R F F E A K G F L E V E T P
R R S E I V R Y I R R F F E A K G F L E V E T P
GTCAAAGGGAAGGCCCGCCTTCTCCTTCAGGGCCTCCACGAAGGAGATGCGCCTGAAGGGCGGCTTGAAGTT
193194195196197198199200201202203204205206207208209210211212213214215216
I L Q P T T G G A E A R P F K T Y H N A L D H E
I L Q - - - - - - - - - - - - - - - - - - - - -
CAGCACCCG---------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F Y L R I S L E L Y L K R L L V G G Y E K V F E
- Y L R I S L E L Y L K - - - - - - - E K V F E
---CAGGCCCGCCATGTCCTGGTAGTCGGCGTAGGC---------------------GAACTCGGGGTTGTG
241242243244245246247248249250251252253254255256257258259260261262263264
I G R N F R N E G I D H N H N P E F T M L E A Y
I G R N F R N - - - - - - - - P E F T M L E A Y
GTTGTGGTCAATGCCCTCGTT------------------------GACCTTCTCGTACCCCCCGACGAGGAG
265266267268269270271272273274275276277278279280281282283284285286287288
W A Y A D Y Q D M A G L V E E L L S G L V L H L
W A - - - Y Q D M A G L V E E L L S - - - - - -
GCGCTT---------CTCCAAGGAGATGCGGAGGTAGAACTCGTGGTCTAGGGC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F G S H E V P Y Q G R V L N F K P P F R R I S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V E A L K E K A G L P F D P L D L E R L R L W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D A H H P E L S Q V P N Y K L L D K L F G I Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E P E L Q D P T F V F D F P L A I S P L A K R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R E K P G L V E R W D L Y A G G M E L A P C Y S
- - - - - - - - R W D L Y A - - - E L A P C Y S
------------------------CACGTCCAGCTTCTTGAG---------TTTGGGCGTGAGGTCCCTCTG
409410411412413414415416417418419420421422423424425426427428429430431432
E L N D P L D Q R E R F L E Q A R R R K E G D E
E - - - - - - - - - - - - - - - - - - - - - - -
GAA---------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E A P E P D E D F L L A L E Y G M P P A A G L G
- - - - - - - - - - - - - - - - - P P A A G L G
---------------------------------------------------GGGGGCGCCCCGCTTGGCCTT
457458459460461462463464465466467468469470471472473474475476477478479480
L G I D R L A M L L T D Q P S L R D V L L F P L
L G I D R L A M L - - - - - - - - - - - - - - -
GAGGATGGCCTCGGCGCTGTGGGTCTT---------------------------------------------
481482483484485486487488489490491492
L K P K K E A V E E G V
- - - - - - - - - - - -
------------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_lys_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L N D L Q Q T R Y G K L Q A L Q A A G I E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y P A R V P Q R T H T L T A V R E Q F S A L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A N A T V T I M G R L R Q R R V M G K S A F A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L N D D H G A F Q I F L S K A D V G D E P F K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F V D L T D L G D I I A V T G T L F T T K M G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P S V H V T S W T M L S K A I T P P P D K R E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q F S D Q E A R Q R Q R Y V D L S A N P E V R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I F R I R A R L I T A M R R Y L D E R G F L E V
- - - I R A R L I T A M R R Y L D E R G F L E V
---------TTTTTCAAAAATGGCATCGCGCATGGTCAAGCGCTGCCACGAACCGCCAAGCTCGATCTGATG
193194195196197198199200201202203204205206207208209210211212213214215216
E T P V L Q G I Y G G A A A R P F T T H H N Q L
E T P V L Q - - - - - - - - - - - - - - - - - -
CCCTTGGTATTCGATGCT------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H Q D L Y L R I A T E L Y L K R L I V G G F D G
- - - - Y L R I A T E L Y L K - - - - - - - D G
------------ATAATCGCCGTAGGCTTGATAGACCTCGATCAT---------------------GCGATC
241242243244245246247248249250251252253254255256257258259260261262263264
V Y E I G K N F R N E G V D R T H N P E F T M I
V Y E I G K N F R N - - - - - - - - P E F T M I
AACGCCTTCGTTGCGGAAGTTTTTGCCAAT------------------------AACGATCAAGCGCTTCAA
265266267268269270271272273274275276277278279280281282283284285286287288
E V Y Q A Y G D Y E S I M Q L T E G M I R F A A
E V Y Q A - - - Y E S I M Q L T E G M I R - - -
ATAGAGCTCGGTGGC---------GTATAAATCTTGGTGCAATTGATTATGATGGGTGGTGAA---------
289290291292293294295296297298299300301302303304305306307308309310311312
E Q I F N S T S I E Y Q G H Q I E L G G S W Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L T M R D A I F E K T G V D I R E C R E F D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W E A I G E A G L K I E R K P T W A K Q V D E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F S E F V E P E L I Q P T F I T E Y P Q P L S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L A K R K A D D P Q F V E R F E L F M L G A E I
- - - - - - - - - - - - - R F E L F M - - - E I
---------------------------------------ATGCTTGAATGGCTCATC---------GGCTTT
409410411412413414415416417418419420421422423424425426427428429430431432
A N A F S E L N D P F D Q E Q R F L E Q G R D Y
A N A F S E L N D P F D Q E Q R F L E Q G R - -
GCTGAGGAAAATTTGAAACGCGCCATGATCATCATTTAAATGGGCGAACGCTGATTTGCCCATAAC------
433434435436437438439440441442443444445446447448449450451452453454455456
A A G D D E A M Q M D E D Y L E A L K V G M P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T G G L G I G I D R L C L L F T N Q T T I R E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492
I F F P H L R K Q G E E
- - - - - - - - - - - -
------------------------------------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_lys_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K E F K E Q R L K E I Q E L R S M G I E P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P Y K F E K E L T A R E I R E K Y D Y L Q A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L E S E K L S F A G R V M S I R H H G K T A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F H M K D D T G R I Q A Y I K A D S V G K E K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D L F K R H V K I G D F V G V R G F P F K S K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G E L T I Y V Q E Y T L L S K A L R P L P E K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H G I K D K E I I Y R Q R Y L E L I V N D E A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E R F K K R F K A V R V I R E F L N S R G F I E
- - - - K R F K A V R V I R E F L N S R G F I E
------------ATCTTCGAGGATGTCCACCCCGAGTTTTTCTTTGAGAAAGTCTCTCATTCTCACTCTTTT
193194195196197198199200201202203204205206207208209210211212213214215216
V E T P I L H Y V T G G A E A R P F V T H L N V
V E T P I L H - - - - - - - - - - - - - - - - -
CCAGGGTGGTGTGAAGTCTAT---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F D I D M Y L R I A P E L Y L K R L I V G G F E
- - - - - Y L R I A P E L Y L K - - - - - - - E
---------------TTCAGTGAGATCCATCATATCGTTGTAATCCGC---------------------GCT
241242243244245246247248249250251252253254255256257258259260261262263264
K I Y E I G K N F R N E G I S Y K H S P E F T S
K I Y E I G K N F R N - - - - - - - - P E F T S
GGTGAACTCGGGACTGTGTTTGTAAGATATTCC------------------------CTCGTATATCTTTTC
265266267268269270271272273274275276277278279280281282283284285286287288
I E I Y Q A Y A D Y N D M M D L T E E L I V E V
I E I Y Q A - - - Y N D M M D L T E E L I V - -
AAAACCGCCGACGATCAA---------GTAAAGCTCCGGTGCGATTCTCAAATACATATCGATATC------
289290291292293294295296297298299300301302303304305306307308309310311312
V K R T C G T L K I S Y Q G K E I D F T P P W K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R V R M R D F L K E K L G V D I L E D P D E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L K K L E E H G V E L E I K N R A H L I D K L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L V E E E L V N P T F I I D H P V V I S P L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K R H R E D P R L T E R F E L I I F G R E I A N
- - - - - - - - - - - R F E L I I - - - E I A N
---------------------------------AAAGTCACCTATTTTGAC---------GAAGAGATCCAT
409410411412413414415416417418419420421422423424425426427428429430431432
A F S E L N D P V D Q Y Q R F L E Q A K M R E E
A F S E - - - - - - - - - - - - - - - - - - - -
CTTTTCCTTCCC------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G D E E A H M M D L D F V R A L E Y G M P P T G
- - - - - - - - - - - - - - - - - - - - P P T G
------------------------------------------------------------TTCAAGAACTTC
457458459460461462463464465466467468469470471472473474475476477478479480
G L G I G L D R L F M F I T D S P T I R D V I P
G L G I G L D R L F M F - - - - - - - - - - - -
TCCAGCTTGAAGATAGTCGTACTTTTCCCTTATTTC------------------------------------
481482483484485486487488489490491492493494495496497498499500501502
F P I V K P K K F E E E E A E F E G G F E E
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_lys_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P E E T S D L A E V R L Q K L Q Q I E A L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D P W G Q R F D N A Q P I G D I R Q L P A E N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D E T K P G P K V R A A G R V V R Y R T G G K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L F L E I W D Q T G R V Q L M I R V N K V T P Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E W Q V A Q L L D L G D L V G V D G E F G K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T G E L T I Q V E K L T F L T K S L E P H P K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V F G M G D I E F R L R H R Y L D M I Y T P D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L R R A H Q R V K I I R T I R T H L D A Q G Y M
- - - - - Q R V K I I R T I R T H L D A Q G Y M
---------------GCCGACGTGTTCGTGGAACAGGTCCGCGTACTTCGCGCGCTGGAACGGCGGCTCGAA
193194195196197198199200201202203204205206207208209210211212213214215216
E V E T P T L H A I A G G A A A R P F E T H H N
E V E T P T L H - - - - - - - - - - - - - - - -
GTTCACCGTCTTCTCGCCGAACGG------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A L D I D L F V R I A L E L P L K R L L V G G I
- - - - - - F V R I A L E L P L K - - - - - - -
------------------GCTGCGGTAGTCGCCGTAAGCCTGGTACAGTTC---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E K V Y E L G R V F R N E G I S P R H N P E F T
E K V Y E L G R V F R N - - - - - - - - P E F T
GTGTCGCGGGCTGATGCCCTCGTTGCGGAACACCCG------------------------CCCGCCGACCAG
265266267268269270271272273274275276277278279280281282283284285286287288
M L E L Y Q A Y G D Y R S M M D L T E G L I V A
M L E L Y Q A - - - Y R S M M D L T E G L I V -
TAGGCGCTTCAGGGGCAGTTC---------GCGCACGAACAGATCGATGTCGAGCGCGTTGTGGTGCGT---
289290291292293294295296297298299300301302303304305306307308309310311312
C V D I L G G G R T I P F G E K T V N F E P P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Q R A K Y A D L F H E H V G C D M T D E V A V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A A A R A E N I E L E M A P T K G A P K V A K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H V V L V Q E L F E D L V E E K L V G P V F V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y P S P L C P L T K R K R E N P A I A E R F E
- - - - - - - - - - - - - - - - - - - - - R F E
---------------------------------------------------------------CGTGACCTT
409410411412413414415416417418419420421422423424425426427428429430431432
L Y V H G M E L A N A Y T E L N D P I T Q E Q T
L Y V - - - E L A N A Y T E L N D P I T Q E Q T
GTTCACGCG---------CTGCACGCGCCCGGTCTGGTCCCAGATTTCGAGGAACAGGAGCTTCCCGCCGGT
433434435436437438439440441442443444445446447448449450451452453454455456
F T Q Q L A G L S D E D S M A K M D H D F I R A
F T Q Q L A - - - - - - - - - - - - - - - - - -
GCGGTAGCGCACCACGCG------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L R H G M P P A G G L G I G I D R L V M L L T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498
T Q T I R D V I L F P L L R P E A K
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_lys_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M N Q K L S E Q E L I R R Q K I E K L Q K L G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V F H E T V K F D L N I N K I I Q K Y N S F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K D E L A K D E F S L S T T G R I I T I R S S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L V L K S Q G S K F Q I Y L P I K E L D K K Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L I D L L D I G D I I F V N G K L M K T Q T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L T L R A N E L K L L S K S L K V L P D K F H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G L N D I E E R Y R H R Y V D L I V N D D V R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T F L L R S R I I S L I R K Y F D N L E Y L E V
- - - L R S R I I S L I R K Y F D N L E Y L E V
---------TTAAGAAGTAGAATTATTTCTTTAATAAGAAAATATTTTGACAACCTAGAATATTTAGAAGTT
193194195196197198199200201202203204205206207208209210211212213214215216
D T P V L Q P I L G G A S A K P F I T K F N A L
D T P V L Q - - - - - - - - - - - - - - - - - -
GATACTCCTGTTTTACAA------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N S N F Y L R I A T E L P L K K L V V G G F D R
- - - - Y L R I A T E L P L K - - - - - - - D R
------------TATTTAAGAATTGCAACAGAACTACCACTTAAA---------------------GATAGA
241242243244245246247248249250251252253254255256257258259260261262263264
V Y E I G R I F R N E G V D T T H N P E F T S I
V Y E I G R I F R N - - - - - - - - P E F T S I
GTTTATGAGATTGGAAGAATTTTCAGAAAT------------------------CCTGAATTTACCTCAATT
265266267268269270271272273274275276277278279280281282283284285286287288
E Y Y E A Y S N N E G M M N R T E D L F K F I A
E Y Y E A - - - N E G M M N R T E D L F K - - -
GAATATTATGAAGCA---------AATGAAGGAATGATGAATCGAACAGAAGATTTATTTAAA---------
289290291292293294295296297298299300301302303304305306307308309310311312
K E L N L K T I F F N G Y E I D L N K P F R R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N M V E A L N E K L G I D L Y K I S F E D A K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L A K K H H I K V E S Y F K I G H I I N E L F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L F I E K D L I Q P T F V Y G H P I E I S P L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
N K N K K N P N F T D R A E L F I G T K E Y A N
- - - - - - - - - - - R A E L F I - - - E Y A N
---------------------------------CGTGCCGAACTGTTTATC---------GAATATGCTAAT
409410411412413414415416417418419420421422423424425426427428429430431432
M F T E L T D P I D Q L E R F K D Q Q N E K D N
M F T E - - - - - - - - - - - - - - - - - - - -
ATGTTTACAGAA------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G N E E A N E I D Y D F V E A L E Y G L P P T G
- - - - - - - - - - - - - - - - - - - - P P T G
------------------------------------------------------------CCTCCAACAGGT
457458459460461462463464465466467468469470471472473474475476477478479480
G C G I G I D R L V M L F T N N E S I R E V L L
G C G I G I D R L V M L - - - - - - - - - - - -
GGATGTGGAATTGGTATTGATAGATTAGTGATGTTA------------------------------------
481482483484485486487
F P H L K N K
- - - - - - -
---------------------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_lys_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M S H E E H N H E E L N D Q L Q V R R D K M N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q L R E N G K D P F G Q R F D R T H Q S T D L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E S Y N E F S K E E L E E K A I E V T I A G R M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M T K R G K G K A G F A H I Q D L K G Q I Q I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V R K D S V G E E Q Y E W F K S S D L G D I V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V T G V M F K T N V G E L S V K A T S F D L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K A L R P L P D K Y H G L K D I E Q R Y R Q R Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L D L I V N P E S K N T F I T R S K I I Q S M R
- - - - - - - - - - - - - - T R S K I I Q S M R
------------------------------------------CGAAGCAAAATCATTCAATCCATGAGAAGA
193194195196197198199200201202203204205206207208209210211212213214215216
R Y L D D H G Y L E V E T P T M H A I P G G A S
R Y L D D H G Y L E V E T P T M H - - - - - - -
TACTTAGATGACCACGGATACTTAGAAGTTGAAACGCCTACGATGCACGCG---------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A R P F I T H H N A L D M P L Y M R I A I E L H
- - - - - - - - - - - - - - - Y M R I A I E L H
---------------------------------------------ATGAGGATCGCTATCGAGCTCCATTTG
241242243244245246247248249250251252253254255256257258259260261262263264
L K R L I V G G L E K V Y E I G R V F R N E G V
L K - - - - - - - E K V Y E I G R V F R N - - -
AAAAGG---------------------AAAGTCTATGAAATCGGACGTGTATTCCGAAATGAA---------
265266267268269270271272273274275276277278279280281282283284285286287288
S T R H N P E F T M I E L Y E A Y A D Y K D I M
- - - - - P E F T M I E L Y E A - - - Y K D I M
---------------GAATTTACGATGATCGAACTTTACGAAGCTTAT---------AAGGATATTATGAGA
289290291292293294295296297298299300301302303304305306307308309310311312
S L T E N L I A H I A Q E V L G T T T V Q Y G D
S L T E N L I A - - - - - - - - - - - - - - - -
TTGACGGAAAATCTCATTGCTCAT------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y E V D L K P E W K R L H M V D A V K E A T G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D F W K E V S V E E A R A F A K E H G I E I S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
S M S V G H I I N E F F E Q K V E E T L I Q P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F I Y G H P V E I S P L A K K N P E D P R F T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R F E L F I V G R E H A N A F T E L N D P I D Q
R F E L F I - - - E H A N A F T E - - - - - - -
TTTGAGCTGTTTATCGTG---------CACGCGAATGCATTTACTGAATTA---------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K E R F E A Q L K E R E E G N D E A H M M D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
F V E A L E Y G M P P T G G L G I G I D R L I M
- - - - - - - - - P P T G G L G I G I D R L I M
---------------------------CCTACCGGCGGCCTTGGAATCGGCATCGACAGACTGATTATGCTT
481482483484485486487488489490491492493494495496497498499500
L L T N S P S I R D V L L F P Q M R H R
L - - - - - - - - - - - - - - - - - - -
TTG---------------------------------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_lys_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Y S I S E Q E L L R R Q K K E E L E A L G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N P Y P S A T F A S N T S T Q D I L S N F N K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P D N F K Q I S I A G R I M G R R I M G A A S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V E L Q D A S G K I Q L Y V H R D T L C P G D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K S F Y N T V F K K L L D I G D L I G I E G Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F T T Q V G E I S I H V N K L T L L S K A L R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P V V K E D D K Q V Y D A F T D P E Q R Y R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R Y V D L L V T P T T R S I F Q K R T Q M I Q A
- - - - - - - - - - - - - - - - K R T Q M I Q A
------------------------------------------------AAAAGGACTCAAATGATACAAGCC
193194195196197198199200201202203204205206207208209210211212213214215216
I R Q Y L N S Q G Y D E V E T P I L Q P L Y G G
I R Q Y L N S Q G Y D E V E T P I L Q - - - - -
ATTCGTCAGTACTTAAACAGCCAAGGATATGATGAGGTAGAAACACCTATTTTGCAA---------------
217218219220221222223224225226227228229230231232233234235236237238239240
A S A R P F K T H H N T L D M S L Y L R I A N E
- - - - - - - - - - - - - - - - - Y L R I A N E
---------------------------------------------------TATCTTCGTATTGCCAACGAG
241242243244245246247248249250251252253254255256257258259260261262263264
L Y L K R L I V G G Y E G V Y E F A K D F R N E
L Y L K - - - - - - - E G V Y E F A K D F R N -
CTATACTTAAAA---------------------GAGGGCGTATATGAATTTGCAAAAGATTTCAGAAAT---
265266267268269270271272273274275276277278279280281282283284285286287288
G M S R F H N P E F T M L E L Y V A Y K D Y K W
- - - - - - - P E F T M L E L Y V A - - - Y K W
---------------------CCAGAATTTACCATGCTGGAATTGTATGTGGCC---------TACAAATGG
289290291292293294295296297298299300301302303304305306307308309310311312
M M N L T E E L L E Q V A L H L Y G T T A V P V
M M N L T E E L L E - - - - - - - - - - - - - -
ATGATGAATCTTACTGAAGAATTACTAGAA------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G T H T I D F K R P W K R F T M F E A I Q H F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G I D I S Q M E E L E L R K A A A T L S V P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A S A G K A K I I D E I F G A K C E P N L I Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T F I T D Y P V E M S P L A K Q H R D N P T L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E R F E V I C N G K E I C N A F S E L N D P I E
- R F E V I C - - - E I C N A F S E L N D P I E
---CGGTTTGAAGTCATCTGT---------GAAATCTGTAATGCTTTTTCTGAGTTAAATGACCCTATCGAG
433434435436437438439440441442443444445446447448449450451452453454455456
Q R K R F E E Q L Q L G Q R G D E E A M M L D E
Q R K R F E E Q L Q - - - - - - - - - - - - - -
CAACGTAAACGCTTTGAAGAACAACTTCAA------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D F L R A L S Y G M P P T A G L G I G I D R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502
M I M T N A P S I Q E V I F F P Q M R P E H
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_lys_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P D A P R P P R P E G L H E Q T I A R L N N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D A Q V D A G F E A Y P Y S Y P Q T H H A R D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F A A H P A R E E G T G E G G T L E P G Q K W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E E S Y S L A G R V T L M R H M G K A A F A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S D E D G K I Q L F F S K Q D T A G F D A T K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I D L G D I I G V K G H P F V T K T G Q L T L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V T E W Q P L V K S L H P L P S K F H G L Q D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E L R A R R R Y V D L M V T E G A R E K F Q A R
- - - - - - - - - - - - - - - - - - - - - - A R
------------------------------------------------------------------GCCCGC
193194195196197198199200201202203204205206207208209210211212213214215216
S R M I R Y I R N E L D E R G F M E V E G P T L
S R M I R Y I R N E L D E R G F M E V E G P T L
AGCCGCATGATTCGGTACATCCGCAACGAACTGGACGAACGCGGCTTCATGGAAGTGGAGGGGCCCACCCTT
217218219220221222223224225226227228229230231232233234235236237238239240
Q V T A G G A E A R P F M T H H N A L S Y D F K
Q - - - - - - - - - - - - - - - - - - - - - - K
CAG------------------------------------------------------------------AAG
241242243244245246247248249250251252253254255256257258259260261262263264
L R I S L E L Y L K R L L V G G F E R V Y E I G
L R I S L E L Y L K - - - - - - - E R V Y E I G
TTGCGCATCAGCCTGGAACTGTACCTCAAG---------------------GAGCGGGTGTACGAGATCGGG
265266267268269270271272273274275276277278279280281282283284285286287288
R V Y R N E G I D R T H N P E F T M L E L Y W A
R V Y R N - - - - - - - - P E F T M L E L Y W A
CGGGTCTACCGCAAC------------------------CCCGAATTCACCATGCTGGAACTGTACTGGGCC
289290291292293294295296297298299300301302303304305306307308309310311312
Y A D Y S D I A K L V E D L L S G L A K E V H G
- - - Y S D I A K L V E D L L S - - - - - - - -
---------TACAGCGACATCGCCAAGTTGGTCGAAGACCTGCTGAGC------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S Y Q F E Y Q G K T L D F T P P F A R V D Y L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G L R E H V P G L D F D P L D L D R L R A F C D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E R F P Q W K G V P S Y K L L D K L F G E F V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P L L S N P T F V M D H P A V I S P L A K K H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S R P E A V T E R F E V F C S G F E L A N A F S
- - - - - - - - R F E V F C - - - E L A N A F S
------------------------CGTTTCGAGGTGTTCTGC---------GAACTGGCGAATGCGTTCTCC
433434435436437438439440441442443444445446447448449450451452453454455456
E L N D A F D Q R E R F E A Q T A R Q A A G D D
E L N D A F D Q R E R F E A Q T A - - - - - - -
GAACTCAACGACGCCTTCGACCAGCGCGAACGCTTTGAGGCGCAGACTGCC---------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E A H P Q D E D F L L A L E Y G M P P A G G L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I G I D R L A M L L T D S D S I R D V L L F P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525
L R P E G G E A E E A D D T A Q E N T A G
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_lys_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E E M N D Q M L V R R Q K L Q E L Y D L G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D P F G S K F D R S G L S S D L K E E W D Q Y S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K E E L V E K E A D S H V A I A G R L M T K R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K G K A G F A H V Q D L A G Q I Q I Y V R K D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V G D D E F D L W K N A D L G D I V G V E G V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F K T N T G E L S V K A K K F T L L T K S L R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P D K F H G L Q D I E Q R Y R Q R Y L D L I T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N E D S T R T F I N R S K I I Q E M R N Y L N N
- - - - - - - - - N R S K I I Q E M R N Y L N N
---------------------------AATCGTAGTAAAATCATTCAAGAAATGCGTAATTATTTAAATAAT
193194195196197198199200201202203204205206207208209210211212213214215216
K G F L E V E T P M M H Q I A G G A A A R P F V
K G F L E V E T P M M H - - - - - - - - - - - -
AAAGGTTTCTTGGAAGTAGAAACACCTATGATGCAC------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T H H N A L D A T L Y M R I A I E L H L K R L I
- - - - - - - - - - Y M R I A I E L H L K - - -
------------------------------TACATGCGTATTGCTATTGAGTTGCATTTAAAA---------
241242243244245246247248249250251252253254255256257258259260261262263264
V G G L E K V Y E I G R V F R N E G V S T R H N
- - - - E K V Y E I G R V F R N - - - - - - - -
------------GAAAAAGTATATGAAATTGGTAGAGTATTCCGTAAT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
P E F T M I E L Y E A Y A D Y H D I M D L T E S
P E F T M I E L Y E A - - - Y H D I M D L T E S
CCTGAATTCACAATGATTGAATTATATGAAGCA---------TATCATGACATTATGGATTTAACAGAATCT
289290291292293294295296297298299300301302303304305306307308309310311312
M V R H I A N E V L G S A K V Q Y N G E T I D L
M V R - - - - - - - - - - - - - - - - - - - - -
ATGGTGAGA---------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E S A W T R L H I V D A V K E A T G V D F Y E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K S D E E A K A L A K E H G I E I K D T M K Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H I L N E F F E Q K V E E T L I Q P T F I Y G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
P T E I S P L A K K N P E D P R F T D R F E L F
- - - - - - - - - - - - - - - - - - - R F E L F
---------------------------------------------------------CGTTTCGAATTGTTC
409410411412413414415416417418419420421422423424425426427428429430431432
I V G R E H A N A F T E L N D P I D Q K G R F E
I - - - E H A N A F T E - - - - - - - - - - - -
ATT---------GAGCATGCAAATGCATTTACTGAA------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A Q L A E K A Q G N D E A H E M D E D Y I E A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E Y G M P P T G G L G I G I D R L V M L L T D S
- - - - P P T G G L G I G I D R L V M L - - - -
------------CCTCCGACAGGTGGTCTTGGTATCGGTATTGACAGATTAGTTATGTTA------------
481482483484485486487488489490491492493494495
P S I R D V L L F P Y M R Q K
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_lys_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D S Q K R H L D E V T G E Y V S K N E L K R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q K L R E K E T K G P A P P A K A A G S G S E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V E G A P E E I D P T K Y F E N R K N E L L A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q K S G R L N P W P H K F V V E M T L A E F R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Y E G K C S L G E M A E E Q V S V A G R I H S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I R T S G A K L V F Y T I H G D N D R L Q I F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H V P K E D S R V K L E F D W D T I V S T L H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G D I V G V K G Y P T T T K S G E L S I I P V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L V L L S P C L H M I P N S P S A L T D I N A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F R Q R Y L D F I I N N T G Q K I V Q R S G I I
- - - - - - - - - - - - - - - - - - Q R S G I I
------------------------------------------------------CAAAGGTCGGGCATAATT
241242243244245246247248249250251252253254255256257258259260261262263264
N F I R R F M I D Q R N Y L E V E T P M L Q T V
N F I R R . M I D Q R N Y L E V E T P M L Q - -
AACTTTATCAGGCGT---ATGATTGATCAGAGGAATTACCTTGAAGTGGAGACTCCGATGCTGCAG------
265266267268269270271272273274275276277278279280281282283284285286287288
H G G A A A Q P F V C K S N D L G H D V Y L R I
- - - - - - - - - - - - - - - - - - - - Y L R I
------------------------------------------------------------TACTTGCGCATT
289290291292293294295296297298299300301302303304305306307308309310311312
A P E L F L K R L V V G G L N R V F E I N K N F
A P E L F L K - - - - - - - N R V F E I N K N F
GCTCCCGAGCTGTTCCTCAAG---------------------AATAGGGTTTTTGAGATAAACAAGAACTTC
313314315316317318319320321322323324325326327328329330331332333334335336
R N E S S D Q T H S P E F T M M E A Y S A Y D D
R N - - - - - - - - P E F T M M E A Y S A - - -
CGCAAC------------------------CCAGAGTTTACCATGATGGAAGCATATTCCGCG---------
337338339340341342343344345346347348349350351352353354355356357358359360
L E D M C D L I E G L V S R L V R W Y N I T Y N
L E D M C D L I E G L V S - - - - - - - - - - -
CTGGAAGATATGTGTGACCTCATTGAGGGCCTTGTTTCG---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H V R L P D E K K H Y K L T F V S H K G E T Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I D F S R P W R R V P I I E T L E Q L L S I K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P R P L D G E E C N G F L V S L L E R L D L E C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K P P L T T A R M L D K L V E R Y L E T L T P N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P I F L M Y H P V L M S P L A K P H R S I P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A E R F E V F I S C F E V S N A Y T E L N N P I
- - R F E V F I - - - E V S N A Y T E L N N P I
------CGCTTCGAGGTCTTCATC---------GAGGTCTCTAATGCCTATACAGAGCTGAATAATCCCATT
505506507508509510511512513514515516517518519520521522523524525526527528
I Q R E N F Q A Q I R D K A A G D M D A M E Y D
I Q R E N F Q A Q I R - - - - - - - - - - - - -
ATTCAGAGGGAGAATTTCCAGGCTCAAATACGA---------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E D F C K C L D Y G L P P T G G I G I G I D R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V M L L T N S S T I R E V I A F P L M G R L V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_lys_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q A Q D L R S A G K E P Y A Y T Y E R T H M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A L H E Q F R D L P D G E M A D L Q V A V A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V M A R R F M G K L A F M S L V D D S G S I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I Y L D K A V L D A A E E D T F K S L K G L I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A G D I I G A R G G M K R T E K G E L S L V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S V Q M L T K S L A P L P D K W H G L A D I E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R Y R Q R Y V D L I V T E G V K G T L R A R A R
- - - - - - - - - - - - - - - - - - - - A R A R
------------------------------------------------------------GCGCGTGCCCGC
169170171172173174175176177178179180181182183184185186187188189190191192
M M G A L R R T L E A R G F L E V E T P V L E T
M M G A L R R T L E A R G F L E V E T P V L E -
ATGATGGGGGCGTTGAGGCGAACGCTGGAGGCGCGGGGATTCTTGGAAGTGGAGACGCCCGTCCTGGAA---
193194195196197198199200201202203204205206207208209210211212213214215216
S A G G A D A R P F T T F H N A L Q Q P Y V L R
- - - - - - - - - - - - - - - - - - - - - V L R
---------------------------------------------------------------GTACTGCGC
217218219220221222223224225226227228229230231232233234235236237238239240
I A T E L H L K R L A V G G M E R I Y E I G R V
I A T E L H L K - - - - - - - E R I Y E I G R V
ATCGCCACAGAGCTGCACCTGAAG---------------------GAGCGAATCTACGAGATCGGACGCGTG
241242243244245246247248249250251252253254255256257258259260261262263264
F R N E G V S T R H N P E F T T L E L Y Q A Y A
F R N - - - - - - - - P E F T T L E L Y Q A - -
TTCCGCAAC------------------------CCTGAGTTCACCACCCTCGAATTATACCAGGCG------
265266267268269270271272273274275276277278279280281282283284285286287288
D Y H D M M D L T E D L V R A A A A E V A G S H
- Y H D M M D L T E D L V R - - - - - - - - - -
---TACCACGACATGATGGATCTCACAGAGGATCTTGTCAGG------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V V Y Q G Q S L D F G P A F R R A S M H D L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K E I T G L D F A A F G N L E D G R S A T L A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K E T N P A S S L T I K A V K G A S S L G V L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N E V F E A E V E Q H L V Q P T F V I D H P V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I S P L A K P H R A K P G L V E R F E L F I Y G
- - - - - - - - - - - - - - - - R F E L F I - -
------------------------------------------------CGGTTCGAGCTGTTCATC------
409410411412413414415416417418419420421422423424425426427428429430431432
R E L A N A Y S E L T D P V D Q R Q R L E A Q L
- E L A N A Y S E L T D P V D Q R Q R L E A Q L
---GAGCTGGCGAACGCATACAGCGAGCTGACGGACCCGGTGGACCAGAGGCAGCGGCTGGAGGCGCAGCTG
433434435436437438439440441442443444445446447448449450451452453454455456
T E R A A R A A A S G Q P R G V V L D E D F I R
T - - - - - - - - - - - - - - - - - - - - - - -
ACC---------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A L E Y G L P P T G G M G M G L D R L C M L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499
D S P S I R D V I A F P L L K R L N E
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_lys_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E L R E T R L E K A Q I L N S L G Q G P Y A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R F E P T H H N S I L Q E S Q Y D L F N G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R N L T V A I A G R V M A K R V M G K L A F F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L A D E T G L I Q L Y I E K A T L A I S M S G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S L A F S H L T S L V D T G D L I G I Y G T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R T E R G E L S V R V K K W H M L T K S L H P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P D K W H G L A D V E K R Y R Q R Y L D L I V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P Q T R E T L R R R A Q V V S G I R R W L D E R
- - - - - - - - R R A Q V V S G I R R W L D E R
------------------------AGACGGGCACAGGTAGTTAGTGGTATAAGGCGTTGGCTTGACGAACGA
193194195196197198199200201202203204205206207208209210211212213214215216
E F L E I E T P V L H V E A G G A E A R P F I T
E F L E I E T P V L H - - - - - - - - - - - - -
GAATTTCTCGAAATTGAAACTCCTGTATTACAT---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q H N T L D L P L Y L R I A T E L H L K R L V V
- - - - - - - - - Y L R I A T E L H L K - - - -
---------------------------TATTTACGTATTGCTACAGAGCTACATTTAAAA------------
241242243244245246247248249250251252253254255256257258259260261262263264
G G F E R V Y E L G R I F R N E G V S S R H N P
- - - E R V Y E L G R I F R N - - - - - - - - P
---------GAACGAGTATATGAATTGGGTCGAATATTTCGTAAC------------------------CCT
265266267268269270271272273274275276277278279280281282283284285286287288
E F T S V E I Y Q A Y A D Y T D M M D L T E Q L
E F T S V E I Y Q A - - - Y T D M M D L T E Q L
GAATTTACATCTGTAGAGATATACCAAGCT---------TATACAGATATGATGGATCTCACAGAACAGTTG
289290291292293294295296297298299300301302303304305306307308309310311312
I D T I A N Q V C G T S K I E Y Q E E I I D L T
I D - - - - - - - - - - - - - - - - - - - - - -
ATCGAT------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P P W R R A T M H E L V K E A T G L D F T L F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D Y E T A S E A I T L S G I M L S K L D A Q S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V G H L L N Y I F E N A V E H T L I Q P T F V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y P I E I S P L A R K H R N K S G L V E R F E
- - - - - - - - - - - - - - - - - - - - - R F E
---------------------------------------------------------------CGTTTTGAA
409410411412413414415416417418419420421422423424425426427428429430431432
L F I V G R E T A N A F S E L I D P I D Q R E R
L F I - - - E T A N A F S E - - - - - - - - - -
CTTTTTATA---------GAAACCGCGAACGCCTTTAGTGAA------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L E A Q Q L R R Q A G D L E A N M I D E D F L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A L E V G M P P T G G L G I G I D R L T M L L T
- - - - - - P P T G G L G I G I D R L T M L - -
------------------CCTCCTACTGGTGGCTTAGGCATAGGTATTGATAGATTGACGATGCTA------
481482483484485486487488489490491492493494495496497498499500501502503504
N S P S I R D V I A F P L L K P E S Q T Q T E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519
R S Q L G T P T L D N G Q S R
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_lys_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T K N N S N V P E I S D E E F Y K N R L L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V T E Q L K D N V Q V Y P H K Y E V N Y R F K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I F T F K D A S E E D L K K V K V Q S A G R I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N F R I H A R Y S F F Q V M S E D F T I Q L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D A Q V L E N K D I I S N I K R G D I V G F S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V L G R T K T K E F S V F I K E L S I L T P C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R T I P T D Y Y G L K D P E I I Y R K R Y L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I N K E S K N R F I Q R T N I I K F I R K Y L
- - - - - - - - - - - Q R T N I I K F I R K Y L
---------------------------------AAGTTCTTCAAGCATATGAAATCTAGCAAAAGGTCTAGC
193194195196197198199200201202203204205206207208209210211212213214215216
D D K D F V E V E T P L L N I I P T G A A A K P
D D K D F V E V E T P L L N - - - - - - - - - -
AAAATTGATTTCCACTGGTTTAACTTCCTTCTCTCGTTTATT------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F T T H H N E L K M N L F L R I A P E L Y L K K
- - - - - - - - - - - - F L R I A P E L Y L K -
------------------------------------CATGTTCATCATATCATTATAATCAGCATATGC---
241242243244245246247248249250251252253254255256257258259260261262263264
L V I G G M D R V Y E I G K L F R N E G I D L T
- - - - - - D R V Y E I G K L F R N - - - - - -
------------------AAATTCGGGATTATGAGTTAAATCAATACCTTCATT------------------
265266267268269270271272273274275276277278279280281282283284285286287288
H N P E F T A C E F Y M A Y A D Y N D M M N M A
- - P E F T A C E F Y M A - - - Y N D M M N M A
------AACTCTATCCATTCCCCCAATAACTAACTTTTT---------CTCGGGGGCAATCCTAAGAAATAA
289290291292293294295296297298299300301302303304305306307308309310311312
E E M L N G M C K Y L H G S E K I V Y A P N K R
E E M L N - - - - - - - - - - - - - - - - - - -
ATTCATTTTTAATTC---------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K E V K P V E I N F A R P F A R F H M L E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S K V V G I K L D G L N I N S D E T L D L L I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T C D K Y E I K V E Q P K T L T R V L D K L V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
H F I E P K C I N P S F I I G Y P L V T S P L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K N H R S E A G M V E R F E L F I N G K E I C N
- - - - - - - - - - - R F E L F I - - - E I C N
---------------------------------TACAACAAGCTGTATGGT---------TGACATAACTTG
433434435436437438439440441442443444445446447448449450451452453454455456
A Y T E L N N P I E Q R M R F K M Q A Q D I N D
A Y T E L N N P I E Q R M R F K M Q A Q - - - -
GAAAAAAGAATACCTAGCATGAATTCTAAAATTTAAAATTCGCCCTGCTGACTGAACTTT------------
457458459460461462463464465466467468469470471472473474475476477478479480
G D D E A M I T D E D F C V A L E Y G L P P T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G F G M G I D R L T M F M T D A A N I K D V I L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514
F P A M K P E S D N
- - - - - - - - - -
------------------------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_lys_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_lys_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P C L S Y I L A A L V E T I I R L L F F F N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F V R M S T E M N N Q S Q I S D T L D S V H Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D N R Y K M M E C I K D A G R P F Y P H K F K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S M S L P A Y A L K Y G N V E N G Y I D K D T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L S L S G R V T S I R S S S S K L I F Y D I F C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E Q K V Q I I A N I M E H D I S T G E F S V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H S E I R R G D V V G F T G F P G K S K R G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L F S K S V V L L S P C Y H M L P T A I S G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K D Q E V R Y R Q R Y L D L M L N E E S R K V F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K L R S R A I K Y I R N Y F D R L G F L E V E T
- L R S R A I K Y I R N Y F D R L G F L E V E T
---CTAAGAAGCAGAGCTATTAAATATATTAGGAATTATTTTGATAGACTCGGGTTTTTAGAAGTAGAAACT
241242243244245246247248249250251252253254255256257258259260261262263264
P M L N M I Y G G A A A R P F I T Y H N E L E T
P M L N - - - - - - - - - - - - - - - - - - - -
CCTATGTTAAAT------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q L Y M R I A P E L Y L K Q L I V G G L D K V Y
- - Y M R I A P E L Y L K - - - - - - - D K V Y
------TATATGAGAATTGCTCCAGAGCTCTATTTAAAA---------------------GACAAAGTATAT
289290291292293294295296297298299300301302303304305306307308309310311312
E I G K N F R N E G I D L T H N P E F T A M E F
E I G K N F R N - - - - - - - - P E F T A M E F
GAAATAGGAAAAAACTTTAGGAAT------------------------CCTGAGTTCACAGCAATGGAGTTT
313314315316317318319320321322323324325326327328329330331332333334335336
Y M A Y A D Y Y D L M D L T E E L I S G L V L E
Y M A - - - Y Y D L M D L T E E L I S - - - - -
TACATGGCA---------TATTATGATTTAATGGATCTGACTGAGGAGTTAATAAGT---------------
337338339340341342343344345346347348349350351352353354355356357358359360
I H G S L K I P Y H P D G P E G K C I E I D F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T P W K R F S F V E E I E S G L G E K L K R P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D S Q E N I D F M V E M C E K H E I E L P H P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T A A K L L D K L A G H F V E T K C T N P S F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I D H P Q T M S P L A K W H R E K P E M T E R F
- - - - - - - - - - - - - - - - - - - - - - R F
------------------------------------------------------------------AGATTC
457458459460461462463464465466467468469470471472473474475476477478479480
E L F V L G K E L C N A Y T E L N E P L Q Q R K
E L F V - - - E L C N A Y T E L N E P L Q Q R K
GAGCTTTTCGTT---------GAACTTTGTAATGCATATACTGAATTAAACGAACCTCTACAACAAAGAAAA
481482483484485486487488489490491492493494495496497498499500501502503504
F F E Q Q A D A K A S G D V E A C P I D E T F C
F F E Q Q A D - - - - - - - - - - - - - - - - -
TTTTTTGAACAGCAGGCTGAT---------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L A L E H G L P P T G G W G L G I D R L I M F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A D K N N I K E V I L F P A M R N V K Q N A Q H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559
S N Q H S G N
- - - - - - -
---------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_pheALPHA_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I V L R P K E Y E V Y K K L I N G Y S N E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N L L G M D E E E L L K I A Y N L Q Q K G L V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I K E E K D T Y Y V L T E K G K K S Y K N L P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R K L Y S L L E L H G E L P L D Q I P L T K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K A I A I G A L K N L D L I E I K D G K I K L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R E I K E F P W E P L L L A I N E G L K K D L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N L K E I E A K L G K K I D T K Y L D Y L K K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G L V K E E T K T R F Y I E V I P K D V V E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D K I D T E V L Q K K L Y K E K P I A P Y N I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E F P K Y Y G G K P H Y Y R E Y L N W V R K K M
- - - - - - - - - - - Y Y R E Y L N W V R K K M
---------------------------------TGGGATTAATTCATATTCCATAGCATTTAGCTCTTTCCA
241242243244245246247248249250251252253254255256257258259260261262263264
V N L G W K E L N A M E Y E L I P M F W C F E A
V N L G W K E L N A . E . E L I - - - - - - - -
TCCGAGGTTTACCATTTTTTTCCTAACCCA---TAA---TTCTCTATA------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L F T P Y D H P S R E L A E S F I I E G K P E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D V P K D I E E K V K E K H L Q Y F G N Y L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E A H L T I L R S Q N T A I T A W N L Y N L R D
- - - - - I L R S Q N T A I T A - - - - - - - -
---------------TTTCTTTAAATAATCTAAATATTTGGTATCGAT------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I L N N E K G K Y F Y I G S V W R P D T I D K T
- - - - - - G K Y F Y I G S V W R P - - - - - -
------------------GTCTTTCTTTAACCCTTCGTTTATTGCTAATAATAA------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H H I E F Q Q L E G I I I G S N M A Q L K T E I
- - I E F Q Q L E G I I I - - - - - Q L K T E I
------CTCTCTCTTTAGTTTTATTTTCCCATCTTTTAT---------------ATTCTTTAATGCCCCAAT
385386387388389390391392393394395396397398399400401402403404405406407408
E K I L K A L G F E K I K L F P A F F P F T E P
E K I L K - - - - - - - - - - - - - - - - - - -
TGCAATGGCTTTTTC---------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S V E V Y A Y H S K L G W V E V A G A G M L R K
S V E V Y A - - - - - - - - E V A G A G M L - -
ATATAATTTTCTTTCAGG------------------------TTTTTCCGTTAAAACATAGTATGT------
433434435436437438439440441442443444445446447448449450451452453454455456
Q I L D S F G I K H K I G A F G I G I N R L A M
- - - - - - - - - H K I G A F G I G I N R L A M
---------------------------TTGTTGCAAATTATATGCTATTTTTAGCAATTCTTCTTCATCCAT
457458459460461462463464465466467468469470471472473474475476477478479480
I A L G I D D I R D L Y G Q D I D K I R E W P I
I - - - - - - - - - - - - - - - - - - - - - - -
CCC---------------------------------------------------------------------
481482483
K Y F
- - -
---------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_pheALPHA_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L V L P L P L Y E I I R H A P E W K P L E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A R E L G S S V D S L M R Y V E E G R A K G V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V E R K V I E F Y E L T E E G R Q R A A E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E Y K L L K S A V C R E G R C T A H L S Q H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E A Q I A L A N L A K L G V K P R G N V V E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E T Y K K I V A M L E E K Q K A L A A P H S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P P E V L K E F I K R K L V R K I E K T Q V Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K A A V P L E L V K P A E V K T V I T S E D I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T G R W R N Y T L K P F D L N I E P P E Y P A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V P H F F N E F L D Y V R E V M I G L G F E E V
- - - F F N E F L D Y V R E V M I G L G F E E V
---------GTAAAAAGTGTCGTGCACCTCCCTCGCGGGGTGGTCCTGCGCTTGGAACAACGCGTCAAAATT
241242243244245246247248249250251252253254255256257258259260261262263264
R G P V L E V E F W N F D A L F Q A Q D H P A R
R G - V L E - - - - - - - - - - - - - - - - - -
CCAAAA---CACCTCCAG------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V H D T F Y V Q W S G P L E T P P E H L M E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V G R V H E E K W R Y K W D R K K A L N P V L R
- - - - - - - - - - - - - - - - - - - - - V L R
---------------------------------------------------------------CTCAGCCGG
313314315316317318319320321322323324325326327328329330331332333334335336
T Q T T A T T I R A L A E R G D G E Y K V F T I
T Q T T A T T I - - - - - - - - - - Y K V F T I
CTTTACTAACTCCAAGGGGACTGC------------------------------TTTCCTGACGAGTTTTCT
337338339340341342343344345346347348349350351352353354355356357358359360
G R V F R P E K L D P K H S M E F H Q L D G I V
G R V F R P - - - - - - - - M E F H Q L D G I V
CTTTATAAACTCTTTTAA------------------------CGCAGCGAGGGCTTTTTGTTTCTCCTCAAG
361362363364365366367368369370371372373374375376377378379380381382383384
V G P G L T F K H L L G Q L E E I A K A L G M T
V - - - - - F K H L L G Q L E E I A K - - - - -
CAT---------------ATAAGTCTCTTCGTCTAGCTCCACGACGTTTCCCCTAGG---------------
385386387388389390391392393394395396397398399400401402403404405406407408
K V K F R P A Y F P F T S P S V E V Y A Q H P K
- - - - - - - - - - - - - - S V E V Y A - - - -
------------------------------------------GAGGTGAGCTGTGCACCT------------
409410411412413414415416417418419420421422423424425426427428429430431432
L G W V E F G G A G I F R P E V T E P L G V K K
- - - - E F G G A G I F - - - - - - - - - - - -
------------CAATAGTTTATACTCCGGCAACCC------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S R V L A W G W G L D R I A M I L L G I D D I R
S R V L A W G W G L D R I A M I - - - - - - - -
GTAGAATTCAATTACTTTCCGCTCCACGCGCAACACCCCCTTGGCCCG------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E L F T K D L E K L K E Y Y A R W A R Y K A S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489
G A V G T L F T L
- - - - - - - - -
---------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_pheALPHA_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K K I A V S E S E Y Q F L K Q L V G R V E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G K A Y T T E E L A K L L G I P R S R V E P L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L L A D K G L L E I E E Q V V E K Y V V T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A K Q Y L E E G F P E E K L V K L L H K N G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P V D E A R R L L G R E F G I A M A N A S R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G W V R V E A G K V K L L V E P T V E A E E K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L R L L S E G R R L S P D E V K L L R R R R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V A P E K E K I T I V R F G K S P E E F L E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V V E V G A L T R Q L I E S G E W R N I R L R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y N V A A E P P K V Y P G R L H F F R Q F V E Y
- - - - - - - - - - - - - - - - F F R Q F V E Y
------------------------------------------------TTTTTCCGCCAGTTCGTGGAGTAT
241242243244245246247248249250251252253254255256257258259260261262263264
L R D V M K E L G F V E I E E P P V E L E F W N
L R D V M K E L G F V E I E E P P V E - - - - -
CTACGCGATGTCATGAAGGAGCTAGGGTTCGTAGAGATCGAAGAACCGCCGGTAGAG---------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y D V L F Q P Q Y H P A R S P T D T F Y L R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R E G V L P A D L A V S V R K A H E E G I A G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R G W G Y R W D P S Q A A R L I L R S H T T A V
- - - - - - - - - - - - - - - I L R S H T T A V
---------------------------------------------ATACTGCGCAGTCATACAACAGCTGTG
337338339340341342343344345346347348349350351352353354355356357358359360
S A R V L A S K P R P P F R F F S L G R V Y R V
S A - - - - - - - - - - F R F F S L G R V Y R V
TCGGCG------------------------------TTCAGATTCTTTAGCCTCGGTAGAGTATACCGTGTA
361362363364365366367368369370371372373374375376377378379380381382383384
E T I D P R H L P E F H Q I D G I A S E D G I S
- - - - - - - - P E F H Q I D G I A S - - - - -
------------------------CCGGAGTTCCACCAGATAGATGGTATTGCGAGC---------------
385386387388389390391392393394395396397398399400401402403404405406407408
L R W L I G M L S E F L E R L G F R E Y K F R P
L R W L I G M L S E F L E - - - - - - - - - - -
CTCCGGTGGCTCATAGGGATGCTCTCAGAGTTCCTGGAG---------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A Y F P F T E P S I E G Y V R V K G Q W L E I L
- - - - - - - - S I E G Y V - - - - - - - E I L
------------------------TCCATAGAGGGCTATGTC---------------------GAGATACTT
433434435436437438439440441442443444445446447448449450451452453454455456
G A G M F R P E M L A A L G I D Y P V A A W G M
G A G M F - - - - - - - - - - - Y P V A A W G M
GGCGCGGGCATGTTT---------------------------------TATCCGGTTGCAGCATGGGGTATG
457458459460461462463464465466467468469470471472473474475476477478479480
G I E R L A M A L Y G L T D I R Q L Y S M D V R
G I E R L A M A - - - - - - - - - - - - - - - -
GGCATAGAGAGGCTAGCCATGGCC------------------------------------------------
481482483484485486487488489490491492493494495496497
F L S T I P S R W W I Y A G A Q V
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_pheALPHA_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R L G Y N E K L V L L K L A E L K N A T V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L I E K T N L D Q V A V M R A L L T L Q S Q G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A K V H E E R R R M I K L T E T G K R Y I E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L P E I R A L K I L K E K G K V T L N D L K D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L S D E E L K A I V G V L R K E G W A E V S K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K E G L T L K L S E K G K K A E K R A I D I A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E V L S K G E V S V E E I E K I I S V K E L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R K I A E E E E K V I R N V E I T D K G L E L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E K G I E L K R E V S I L T P E L I V T G K W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E V E F K P F N I K A P V K K I Y P G K K Q P Y
- - - - - - - - - - - - - - - - - - - - - - P Y
------------------------------------------------------------------ATCGAC
241242243244245246247248249250251252253254255256257258259260261262263264
R V F L D K I R R R L I E M G F I E M T V D S L
R V F L D K I R R R L I E M G F I E M T V . S L
AGTCATTTCAATGAATCCCATTTCTATTAGCCTTCTTCTTATTTTATCCAAGAAGACTCTATA---CTGCTT
265266267268269270271272273274275276277278279280281282283284285286287288
I E T Q F W N F D A L F Q P Q N H P A R E W T D
I E - - - - - - - - - - - - - - - - - - - - - -
TTTCCC------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
T Y Q L K Y P E K G Y L P D E N L V S K V K E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H E R G L A G S R G W G Y V W S P E R A M L L M
- - - - - - - - - - - - - - - - - - - - - - - M
---------------------------------------------------------------------CTC
337338339340341342343344345346347348349350351352353354355356357358359360
P R A H A T A L S A R E L A K G I E I P G K Y F
P R A H A T A L S A - - - - - - - - - - G K Y F
TTTAACTGAAATTATCTTTTCAATTTCTTC------------------------------TAAAGCTATATC
361362363364365366367368369370371372373374375376377378379380381382383384
T I Q R V F R P D V L D R T H L I E F N Q I D G
T I Q R V F R P - - - - - - - - I E F N Q I D G
AATAGCTCTTTTTTCAGCTTTTTT------------------------AAGACCTTCTTTAGTTTTACTAAC
385386387388389390391392393394395396397398399400401402403404405406407408
F V A S E D L T F R H L L G I L K R F A I E I A
F V A - - - - - F R H L L G I L K R F A I - - -
TTCAGCCCA---------------TACTCCAACTATGGCCTTTAGCTCCTCATCACTTAAGAC---------
409410411412413414415416417418419420421422423424425426427428429430431432
G A K K V K F F P D Y Y P F T E P S V Q L S A Y
- - - - - - - - - - - - - - - - - S V Q L S A -
---------------------------------------------------TTCTGGAAGTCCGATTTC---
433434435436437438439440441442443444445446447448449450451452453454455456
H P E L G W V E F G G A G I F R E E M T E A L G
- - - - - - - E F G G A G I F - - - - - - - - -
---------------------TAATTTTATCATCCTTCTCCTTTC---------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I K V P V I A W G I G I D R L A M F K L G V D D
- - V P V I A W G I G I D R L A M F - - - - - -
------TGTTAAAAGAGCCCTCATCACTGCTACTTGATCTAAATTTGTCTTTTC------------------
481482483484485486487488489490491492493494495496497498499
I R Y L F S Y D L K W L R E S K L I W
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_pheALPHA_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G A R I P V S E S E Y R L L E R L V G R V E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G K P Y T T E A L A R L T G L D R S Q V E A L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L L A E K G L L Q L E E R V S E R Y R L T E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E R Y L R E G F P E E R L A R L L A E H G G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M P V E E A R R L L G G E F G I A M A N A S R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G W V R V E S G E I V L A A E P P L V A E E R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L L E R L S R G E R V S G D D L R M L R R R R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V E P V K E K A T F I T L E E P P E K L L G R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E V E V G A L T R R M L E T G E W R R V R L R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y N V A A E P P R L Y P G R L H F F R Q L I E H
- - - - - - - - - - - - - - - - F F R Q L I E H
------------------------------------------------GTCATAGTTCCAGAACTCCAGCTC
241242243244245246247248249250251252253254255256257258259260261262263264
I R D V M K E L G F V E V E E P P V E L E F W N
I R D V M K E L G F V E V E E P P V E - - - - -
CACCGGCGGCTCCTCGACCTCCACGAAGCCGAGCTCCTTCATGACATCGCGTATATG---------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y D V L F Q P Q Y H P A R S P T D T F Y L R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R E G E P P R E L A E M V R R A H E E G L A G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R G W G Y R W D P S R A A R L I L R S H T T A V
- - - - - - - - - - - - - - - I L R S H T T A V
---------------------------------------------CGGCTCGACCAGCCTGCGGCGGCGGAG
337338339340341342343344345346347348349350351352353354355356357358359360
S A R V L A Q R P R P P F R F F S I G R V Y R V
S A - - - - - - - - - - F R F F S I G R V Y R V
CATCCT------------------------------GCTAAGCCTCTCCAGGAGACGACGCTCCTCAGCAAC
361362363364365366367368369370371372373374375376377378379380381382383384
E T V D P H H L P E F H Q V D G I A S E D G V S
- - - - - - - - P E F H Q V D G I A S - - - - -
------------------------TATCTCACCAGACTCGACGCGTACCCAACCCTT---------------
385386387388389390391392393394395396397398399400401402403404405406407408
L R W L M G M L G E L L E R L G L R E Y R F R P
L R W L M G M L G E L L E - - - - - - - - - - -
CATAGCTATGCCGAACTCACCGCCCAGCAGCCTCCTGGC---------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A Y F P F T E P S L E G Y V R V G S Q W L E V L
- - - - - - - - S L E G Y V - - - - - - - E V L
------------------------CGGGAAGCCCTCGCGGAG---------------------TAGCCTATA
433434435436437438439440441442443444445446447448449450451452453454455456
G A G L F R P E M L A A L G I D Y P V A A W G M
G A G L F - - - - - - - - - - - Y P V A A W G M
GCGCTCAGAGACACG---------------------------------GAGCCTTGCCAGAGCCTCCACCTG
457458459460461462463464465466467468469470471472473474475476477478479480
G I E R L A M A L Y G L S D I R Q L Y S S D A R
G I E R L A M A - - - - - - - - - - - - - - - -
GCTGCGGTCGAGGCCGGTAAGCCT------------------------------------------------
481482483484485486487488489490491492493494495496497
F L S T I P S R W R L Y A G A P V
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_pheALPHA_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q E E L E A L R H A I E T T P I D S E E A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A F R I R F L G Q R S G Q I T H L F K R I R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P P E E R P R I G Q Q L N A L K R L A E Q R L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A R A R L R R A A R P R T E V P D L T L P G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R T F T G S L H P L T R T L E A I V R V F E Q L
- - - - - - - - P L T R T L E A I V R V F E Q L
------------------------CAGGTAGAGCACCTGCTTCAGGTCACCCATCGACACGTTTCGATCCAC
121122123124125126127128129130131132133134135136137138139140141142143144
G F S V A E G P E I E D D W H N F T A L N F P P
G F S V A E G P E I E - - - - - - - - - - - - -
GTAGAGCCCTTCGACCTGGTGAAACAGGCAGAA---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D H P A R D M Q D T F F L H Q G A S H Q E A V V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GCG
169170171172173174175176177178179180181182183184185186187188189190191192
L R T H T S P V Q I R V M E R M A P P I R I I A
L R T H T S P V Q I - - - - - - - - - I R I I A
GAGCACGACGGCCTCCTGATGGGAAGCGCC---------------------------GTCGCGGGCCGGGTG
193194195196197198199200201202203204205206207208209210211212213214215216
P G R V Y R N E A V S Y K S F C L F H Q V E G L
P G R V Y R N - - - - - - - - C L F H Q V E G L
GTCCGGCGGGAAGTTCAGCGC------------------------GATTTCCGGGCCTTCGGCCACCGAAAA
217218219220221222223224225226227228229230231232233234235236237238239240
Y V D R N V S M G D L K Q V L Y L F A R A L F G
Y V - - - - - M G D L K Q V L Y L F A R - - - -
GCCGAG---------------GACGATGGCTTCGAGTGTCCGGGTCAGCGGATGGAGCGA------------
241242243244245246247248249250251252253254255256257258259260261262263264
E D V R M R F R P S F F P F T E P S A E V D I W
- - - - - - - - - - - - - - - - - S A E V D I -
---------------------------------------------------CCGGCGCAGGCGGGCACG---
265266267268269270271272273274275276277278279280281282283284285286287288
W P L P D H P E G G Q W M E I L G C G M V H P N
- - - - - - - - - - - - - E I L G C G M V - - -
---------------------------------------CAGTTGCTGGCCGATGCGGGGACG---------
289290291292293294295296297298299300301302303304305306307308309310311312
V F R A V G I D P E Q Y T G Y A F G M G V E R I
- - - - - - - - - - - Y T G Y A F G M G V E R I
---------------------------------GATCTGACCGCTGCGCTGTCCCAGAAAGCGAATGCGGAA
313314315316317318319320321322323324325326327328329330331332333334335336
A M L R Y G I D D I R L F Y E N D L R F L E Q F
A M L - - - - - - - - - - - - - - - - - - - - -
GGCCTCGGC---------------------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_pheALPHA_aa
Archaea/Staphylothermus marinus/Smarinus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Q D S D D K Y Y L P N R Q Y R I V E V L L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S G S L S V E E L A R A L D E K P E N I M R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A E L E A K G L L R V I R K I K Q V P V I T D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G R E V L S S R T P E E R V F R V M Y R C V G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N V E D F L E C V S S E A G I E K Q K A Q I G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q H L V R N K C L S V M S G V V V V G D E Y G C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
H K A I E E A S I I R S A L E K I M R G E T V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D N I I N I L K R R R M I R T E K K T I I I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P S D V L E K L F R E G L I T R R E L L T V V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P K P K D E L E K Y V I K E F D L T V P P P K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V G G R L N A Y I E F L D L V R D I L V S M G F
- - - - - - A Y I E F L D L V R D I L V S M G F
------------------TAATTCAACATGTGGGCCTTTAACTTCTTCAAAACCCATGGAGACCAGTATATC
265266267268269270271272273274275276277278279280281282283284285286287288
E E V K G P H V E L E F W N F D A L F Q A Q D H
E E V K G - H V E - - - - - - - - - - - - - - -
ACGGACAAGGTCGAG---CTCTATATA---------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P A R E I H D T F F L K M D F K G K V P E E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S R A G K I H E R G W G Y K W D P I R A L R P I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------CTT
337338339340341342343344345346347348349350351352353354355356357358359360
L R S Q T T A V S V R A I Y E R G E G E Y R V F
L R S Q T T A V S V - - - - - - - - - - Y R V F
CTCGGTTCTTATCATTCGTCTACGTTTTAG------------------------------GCCACGCATTAT
361362363364365366367368369370371372373374375376377378379380381382383384
S L D R V F R P E T L D A K H A M E F Y Q L D G
S L D R V F R P - - - - - - - - M E F Y Q L D G
TTTTTCGAGAGCAGACCTTATGAT------------------------ACAACCATATTCATCGCCTACAAC
385386387388389390391392393394395396397398399400401402403404405406407408
V I V G K N V T F K H L L A F F K E F A A A L G
V I V - - - - - F K H L L A F F K E F A A - - -
AACGACTCC---------------ACATTTATTCCTGACTAGATGTTGGAAGCCTATTTGGGC---------
409410411412413414415416417418419420421422423424425426427428429430431432
I R E V W F K P G Y F P F T E P S V E G F I K H
- - - - - - - - - - - - - - - - S V E G F I - -
------------------------------------------------CCTACCAACACATCTATA------
433434435436437438439440441442443444445446447448449450451452453454455456
P H L G W I E V F P G G V F R P E V M E I L G A
- - - - - - E V F P G G V F - - - - - - - - - -
------------------CGGTGTTCTTGAACTAAGAACTTC------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P G V R A I A W G I G I D R L A M A V L G L D D
- - V R A I A W G I G I D R L A M A - - - - - -
------TTTACGGATTACTCTAAGTAACCCTTTAGCTTCGAGCTCAGCTAGATC------------------
481482483484485486487488489490491492493494495496497498499500501502503504
I R D L F S K D L D F L Q K L P T P I L P Y F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519
S K T Q G S D V R V V S V P K
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_pheALPHA_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E I S K N E A L I L K Y L A S K N Q E I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S N I E I K G L S R Q D I A S A T S W L Q V K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L I D V K T R E E V A Y V L T D E G K R Y A E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G L P E L R A Y S I L K R K G K L S L R D L Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A M P D E Y K I V L A Q L A K F G I T P K N G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L E Y S D G H I E A E I S R R Q R F L S D L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D D Q E M I E H F K R R K N V I E E K K R S V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I V S I N S K G L E Q L N N F D Q F E A I G E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D S G I I T S Q A W K T A P F R K Y D L D A P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S P T K S Y A K H P L V Y F I N E I R R I F L D
- - - - - - - - - P L V Y F I N E I R R I F L D
---------------------------CCGTTAGTATACTTTATCAATGAGATAAGGCGGATATTCTTAGAT
241242243244245246247248249250251252253254255256257258259260261262263264
M G F T E M S G H Y I E S A L W D M D A L F I P
M G F T E M S G H Y I E - - - - - - - - - - - -
ATGGGTTTTACCGAGATGAGTGGACATTATATAGAA------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q D H P A R D M Q D T F Y V K D S N F T I E H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E I E K R I K R I H E R G F D G Y S G W G Y R W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S S D D G K K L I L R T H T T V T T A R Y L Y E
- - - - - - - - I L R T H T T V T T A - - - - -
------------------------ATACTCAGGACGCATACAACGGTAACTACTGCC---------------
337338339340341342343344345346347348349350351352353354355356357358359360
H N T Y P Q A I F S V E K V F R H E S V D W K H
- - - - - Q A I F S V E K V F R H - - - - - - -
---------------CAGGCGATATTTTCAGTGGAAAAAGTATTCAGGCAC---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L A E F Y Q I E G A V Y D K N V S V A T L K W I
- A E F Y Q I E G A V Y - - - - - V A T L K W I
---GCAGAATTTTACCAGATAGAAGGCGCAGTATAT---------------GTTGCGACGCTTAAATGGATA
385386387388389390391392393394395396397398399400401402403404405406407408
L R T F Y G K L G F E K I R L V P S Y Y P Y T E
L R T F Y G - - - - - - - - - - - - - - - - - -
CTCCGCACGTTCTATGGT------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P S L D V V V E V D G K E M E L G G S G I F R P
- S L D V V V - - - - - - - E L G G S G I F - -
---AGCCTGGACGTGGTTGTG---------------------GAACTCGGTGGTTCAGGTATATTT------
433434435436437438439440441442443444445446447448449450451452453454455456
E V G K I L G L K A P V M A W G M G L E R L A M
- - - - - - - - - A P V M A W G M G L E R L A M
---------------------------GCCCCTGTTATGGCTTGGGGGATGGGCTTGGAACGTTTAGCTATG
457458459460461462463464465466467468469470471472473474475476477478479480
L Y Y G L T D V R D L Y N T D F S F L E G Y K I
L - - - - - - - - - - - - - - - - - - - - - - -
CTC---------------------------------------------------------------------
481482
K Y
- -
------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/pheALPHA_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S K I E L M L L R S L E T G K T Y T P E E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A E L S G L S K D A V L K A A Y M L Q E R G Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V I E N V R T H Y S L T E E G E R Y L K E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E E K L Y S L V K S G V N S M D E L R K R M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E F Q I A L G W L R R K G A V E V E G D K V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P K R E P S F D E R A A L Q A I K E G R G V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G T L K T L M K R K L V T K S E T K Q V Y I E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L K K P E I E L E D I I T D L T P E M L L E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
W R G K R F L K Y D I T I P A K E I Y G G K I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P Y E R I I E E C R K V F L E M G F T E I K G H
P Y E R I I E E C R K V F L E M G F T E I K G H
CCGTATGAGAGAATAATCGAGGAGTGCAGAAAGGTGTTCCTCGAAATGGGCTTTACTGAGATAAAGGGTCAC
241242243244245246247248249250251252253254255256257258259260261262263264
Y V Q P A F W N F D A L F Q P Q D H P A R D M Q
Y V Q - - - - - - - - - - - - - - - - - - - - -
TACGTCCAG---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D T F Y L D R Y I D L E G E I V E R V K A T H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N G W I T G S T G W G G E W S L E K A R Q L V L
- - - - - - - - - - - - - - - - - - - - - - V L
------------------------------------------------------------------GTTCTC
313314315316317318319320321322323324325326327328329330331332333334335336
R T H T T A I T I H Y L A E N P E P P Q K A F C
R T H T T A I T I - - - - - - - - - - Q K A F C
AGAACCCACACAACAGCAATAACCATA------------------------------CAAAAGGCCTTCTGC
337338339340341342343344345346347348349350351352353354355356357358359360
I D R V Y R R E T I D A T H L P E F D Q L E G V
I D R V Y R R - - - - - - - - P E F D Q L E G V
ATCGACAGGGTTTACAGAAGG------------------------CCAGAGTTCGACCAGCTCGAAGGAGTT
361362363364365366367368369370371372373374375376377378379380381382383384
V L D R D V G F K H L L G L L K E F F T K M G F
V L - - - - - F K H L L G L L K E F F T - - - -
GTCCTC---------------TTCAAGCACCTTCTCGGCTTACTTAAGGAGTTCTTCACG------------
385386387388389390391392393394395396397398399400401402403404405406407408
E D V R F R P G Y F P Y T E P S V E P E V Y V E
- - - - - - - - - - - - - - - S V E P E V - - -
---------------------------------------------AGCGTTGAGCCTGAGGTT---------
409410411412413414415416417418419420421422423424425426427428429430431432
G L G W V E L G G A G V F R K E V T E P L G I R
- - - - - E L G G A G V F - - - - - - - - - - -
---------------GAGCTTGGTGGGGCAGGAGTTTTC---------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G K V L A W G L G I G R L A M L K I G L K D L R
G K V L A W G L G I G R L A M L - - - - - - - -
GGCAAGGTTCTAGCATGGGGACTTGGTATAGGAAGGCTTGCAATGCTC------------------------
457458459460461462463464465466467468469470471472473474
R L Y L P D L G W L R S M P V A R K
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_pheALPHA_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K L P A Q Q A A V L E A A S A D E P R R I D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A A D L G E P P E T V T G A A F E L A D A G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V D V T E E T A D E V E L T D E G R E Y A D T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L P E V R L Y E A A L D A G A D D E P V Q M G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V I G A S G L E G P Q V D I A L S N Y A R K G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G A I E S G A L A A D P S A D P E D D A E A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L R A L A D D E S V P G D A P L D Q L E R R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V V R R E R T V R S V Q L T E A G V T E L M A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V E A S D A V G Q L T P E L L A S G D W R D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F A D Y N V E A D A A E H T P G K V H V L R Q A
- - - - - - - - - - - - - - - - - - - V L R Q A
---------------------------------------------------------GTGCTCCGGCAGGCA
241242243244245246247248249250251252253254255256257258259260261262263264
A E R V E E V L V G M G F Q E M E G P H V D A D
A E R V E E V L V G M G F Q E M E G P H V D - -
GCCGAGCGCGTCGAGGAAGTGCTGGTCGGGATGGGGTTCCAGGAGATGGAAGGGCCGCACGTCGAC------
265266267268269270271272273274275276277278279280281282283284285286287288
F Y I N D C L F M P Q D H P A R N H W D R F A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S N P E K I E D L P A D L V D R V E R A H R E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V G P D G D G Y H S P W D E D F A R A L A L R G
- - - - - - - - - - - - - - - - - - - - A L R G
------------------------------------------------------------GCGCTCCGCGGG
337338339340341342343344345346347348349350351352353354355356357358359360
H T T S L T A R Y L S G V A G E D I E P P Q R Y
H T T S L T A - - - - - - - - - - - - - - Q R Y
CACACGACGAGCCTCACCGCT------------------------------------------CAGCGCTAC
361362363364365366367368369370371372373374375376377378379380381382383384
F S V E K A Y R N D T L D A T H L L E F F Q I E
F S V E K A Y R N - - - - - - - - L E F F Q I E
TTCAGCGTCGAGAAGGCCTACCGGAAC------------------------CTGGAGTTCTTCCAGATCGAG
385386387388389390391392393394395396397398399400401402403404405406407408
G W V M A E D L S V R D L M G T F R E F Y S Q F
G W V M - - - - - V R D L M G T F R E F Y S - -
GGCTGGGTGATG---------------GTTCGGGACCTGATGGGGACGTTCCGGGAGTTCTACAGC------
409410411412413414415416417418419420421422423424425426427428429430431432
G I T D L E F K P T Y N P Y T E P S F E L F G R
- - - - - - - - - - - - - - - - - S F E L F G -
---------------------------------------------------AGCTTCGAACTGTTCGGC---
433434435436437438439440441442443444445446447448449450451452453454455456
H P E T G E L I E I G N S G I F R P E M L E P L
- - - - - - - - E I G N S G I F - - - - - - - -
------------------------GAGATCGGGAACTCCGGCATCTTC------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G V E A D V M A W G L A L E R L L M L V T G F E
- - - A D V M A W G L A L E R L L M L - - - - -
---------GCCGACGTGATGGCGTGGGGGCTCGCCCTCGAGCGACTACTGATGCTT---------------
481482483484485486487488489490491492493494495496497498499500501502
D I R D V H G T L C D L E F L R D A E V V Y
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_pheALPHA_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S A Q D N L T I N E K K V L L A L E E L G S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A P D K L E E K S G L Q V D A A M Q A A F M L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K G L A S V S E K V L E R Y S L T K E G E E Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T K T G L P E R Q I I D A L K A P A P L E E L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S R F S P K T V G I A T G W L I K K G W A K V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N G V M V P S G N A P A G R D E E V L A A F A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K A K T L E E L A A D E G T V K E L L K R K L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I K H E E K S R T V S V T G A G S A L A A E G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V L E E E I A Q L T P E L L K S G A W K G K K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R P Y R L D I A P N P L Y G V K I H P Y R R L I
- - - - - - - - - - - - - - - - - - P Y R R L I
------------------------------------------------------TATGCCGCCTTTGATTTC
241242243244245246247248249250251252253254255256257258259260261262263264
E Q M R Q I F L E M G F T E I K G G I I Q S S F
E Q M R Q I F L E M G F T E I K G G I I Q - - -
CGTGAAGCCCATTTCCAGGAAGATCTGGCGCATCTGTTCAATCAAACGCCTGTAAGGGTGGAT---------
265266267268269270271272273274275276277278279280281282283284285286287288
W N F D A L F Q P Q D H P A R D M Q D T F H L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
S I C Q L P A E Y S D K V A A M H E S G G D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S C G W G G I W D R E L A R R N V L R T H T T S
- - - - - - - - - - - - - - - - V L R T H T T S
------------------------------------------------GCGCTTGAGCAGTTCCTTTACAGT
337338339340341342343344345346347348349350351352353354355356357358359360
V T I K Y L A D N P E P P V K A F C I D R A Y R
V T I - - - - - - - - - - V K A F C I D R A Y R
TCCTTCGTC------------------------------GCCTGCGAAAGCCGCAAGAACTTCTTCGTCCCT
361362363364365366367368369370371372373374375376377378379380381382383384
R E T I D P T H T P E F E Q L E G V V M D K D M
R - - - - - - - - P E F E Q L E G V V M - - - -
GCC------------------------CATAACTCCGTTTTCAACCTTTGCCCACCCTTT------------
385386387388389390391392393394395396397398399400401402403404405406407408
S F A D L L G L L A E F Y H R M G F E E V R F R
- F A D L L G L L A E F Y H - - - - - - - - - -
---GGTTGCGATCCCCACGGTCTTGGGGGAAAAGCGGCTCCT------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P G Y F P Y T E P S V E P E V Y V D G L G W V E
- - - - - - - - - S V E P E V - - - - - - - - E
---------------------------TCCGGTTTTCGTATATTC------------------------ACG
433434435436437438439440441442443444445446447448449450451452453454455456
L G G A G V F R K E V T E P F G I K E P V L A W
L G G A G V F - - - - - - - - - - - E P V L A W
TTCGAGCACTTTTTCAGATAC---------------------------------TGCCTGCATTGCCGCATC
457458459460461462463464465466467468469470471472473474475476477478479480
G L G V S R L A M L K L G L K D L R L L Y Q S D
G L G V S R L A M L - - - - - - - - - - - - - -
CACCTGCAGCCCGGACTTCTCTTCCAGTTT------------------------------------------
481482483484485486487488489490491492
I D W L R K S E V C R I
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_pheALPHA_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q L T L N E K R L L L E L V K T E T T T P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M G T I L D R P A D S V I Q Y G G L L S Q K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A Q V D R A V T T T L T L T E E G T Q Y L K E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L P E R Q L Y D S F S E S A S I A D L N T H P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A K I G L G W M K R L G W V K I E A G N V I K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G D P A P S P I E L A L K N P D A A P A D I K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D L L K R G L V T E E E S V R Y T I T I T D E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K K L A A A G I T L T Q E T G T L T A D Q I S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G A W K D L S L R R Y D I T K H P R P V W P G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I H P Y Q R M I D E M R R I L L D M G F T E L H
- - - Y Q R M I D E M R R I L L D M G F T E L H
---------ATGATCCTGTGGCTGGAAAAGGGCATCAAAATTCCAGAAAGCTCCCTGAATGATGCTGCCATG
241242243244245246247248249250251252253254255256257258259260261262263264
G S I I Q G A F W N F D A L F Q P Q D H P A R E
G S I I Q - - - - - - - - - - - - - - - - - - -
TAGTTCGGTAAAACC---------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
M Q D T F H L A G K Q E L P V G W E K V R D M H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E S G G E T S S T G W G G K W D P E K A K A T V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------TCC
313314315316317318319320321322323324325326327328329330331332333334335336
L R T H T T S L S I Q H L A A H P E P P V K A F
L R T H T T S L S I - - - - - - - - - - V K A F
CTCATCGGTGATAGTGATCGTATACCGGAC------------------------------GAGAAGATCCTT
337338339340341342343344345346347348349350351352353354355356357358359360
C I G R V Y R R E A I D P T H L P E F E Q L E G
C I G R V Y R R - - - - - - - - P E F E Q L E G
CTTGATGTCAGCTGGAGCAGCATC------------------------CGGAGACGGAGCAGGATCACCGGT
361362363364365366367368369370371372373374375376377378379380381382383384
I V M D T H V N F R N L L G Y L K E F Y G R M G
I V M - - - - - F R N L L G Y L K E F Y G - - -
CTTGATGAC---------------TTTCACCCAGCCAAGCCGTTTCATCCAGCCAAGACCGAT---------
385386387388389390391392393394395396397398399400401402403404405406407408
F E S V R F R P G Y F P Y T E P S V E P E V Y I
- - - - - - - - - - - - - - - - S V E P E V - -
------------------------------------------------ATAGAGCTGCCGTTCAGG------
409410411412413414415416417418419420421422423424425426427428429430431432
E G L G W V E L G G A G I F R E E V T A P W G I
- - - - - - E L G G A G I F - - - - - - - - - -
------------------TCCTTCCTCGGTCAGAGTAAGTGT------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T C P V L A W G L G V S R V A M L R M G L T D L
- C P V L A W G L G V S R V A M L - - - - - - -
---TTTCTGGGACAAGAGTCCTCCATATTGAATGACTGAATCAGCAGGCCG---------------------
457458459460461462463464465466467468469470471472473474475476477478
R E L Y Q S D I D W V R N V P V V Q G G R C
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_pheALPHA_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E D F K L H N D E K K L L K I F Q E A Y D N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N I T K L S V E G L A K N E L M G S E T K V M R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T A L W L S A E D K K L V N I I E N K S K I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L T E E G K K V V E K G L P E R Q V A N Y M I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
N D L K N I P I K E L G N I L D K S E V N P A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G N L K K K K I A K I E K G N I I I E N L Q Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D K E E N T L N K I K I N E E N K N S D L N N Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N D E E K K L I N N L Q K R G F I A I E E E V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R A I E L T E K G I E F I K N N I I E I K E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S Q L T R E H I V S G K W K D C H I R P Y D A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I P S E E V Y P A K L H P M T R I I N D V K E V
- - - - - - - - - - - - P M T R I I N D V K E V
------------------------------------TTTAACATCATTTATAATTCGTGTCATAGGGTGTAA
265266267268269270271272273274275276277278279280281282283284285286287288
L I G M G F K E V K N P I V E T E F W N F D V L
L I G M G F K E V K N P I V E - - - - - - - - -
TTTAGCAGGATATACTTCCTCTGATGGTATTTTTGCATCATATGG---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F E P Q D H P A R D M Q D T F F L R Y P N K G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I P E M V K D I K S I H E K G M V G D K K I S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G W R Y E F D E E I S K K T V L R T H T T V S S
- - - - - - - - - - - - - - V L R T H T T V S S
------------------------------------------ATCGCTGTTTTTGTTTTCTTCATTTATTTT
361362363364365366367368369370371372373374375376377378379380381382383384
I K Y L A S L T D E E K E K P H K I F S I D R V
I - - - - - - - - - - - - - - H K I F S I D R V
TAT------------------------------------------TTCAATTATTATATTTCCTTTTTCTAT
385386387388389390391392393394395396397398399400401402403404405406407408
F R N E A I D Y S H L P E F Y Q C E G I I L A E
F R N - - - - - - - - P E F Y Q C E G I I L - -
TTTAGCTAT------------------------TGCAGGATTTACTTCTGATTTGTCTAAAATATT------
409410411412413414415416417418419420421422423424425426427428429430431432
G V H F D N L I G L L K E F L N R L G F E Q V R
- - - F D N L I G L L K E F L N - - - - - - - -
---------TGGGATATTTTTTAAATCATTTTCAATCATATAATTTGC------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I R P A Y F P F T E P S L E A E V F V E G R G W
- - - - - - - - - - - S L E A E V - - - - - - -
---------------------------------GGCAATTTTTGATTTATT---------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L E L L G A G V F R P E V V E P L G I N K P V L
- E L L G A G V F - - - - - - - - - - - K P V L
---ATCTTCCGCAGATAACCAAAGAGC---------------------------------CTCATTTTTTGC
481482483484485486487488489490491492493494495496497498499500501502503504
A W G I G L S R L A M L R W G L T D I R E L H K
A W G I G L S R L A M L - - - - - - - - - - - -
TAATCCCTCAACAGATAATTTTGTAATATTTTTATT------------------------------------
505506507508509510511512513
N E L N W L K K A
- - - - - - - - -
---------------------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_pheALPHA_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L H I D E K R L L K I F Q D N N R D E F N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N E L E K F M P K E K I L R V S L W L K G K N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V E T E E K V K K I I K L I K E E E F P E R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A N Y L K Q H N I K E I E I K N L K D I L P K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E I N A A L G A I K R K G I A R I E K G K I I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D N L D Y K D V E E Q L L Q K I K E N K Y L D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
F S E E E K K I I D I L K K R G Y V D F D E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E I K I K L T E K G K E F I K N P I E I E E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T Q L T R D I I I S G K W K K A Y I R P Y D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V P T K P I Y P A K V H P L T R I I R E V K E I
- - - - - - - - - - - - P L T R I I R E V K E I
------------------------------------CCATTGACAAGAATTATTAGAGAGGTTAAAGAGATT
241242243244245246247248249250251252253254255256257258259260261262263264
L L A M G F K E V K S P I V E T E F W N F D M L
L L A M G F K E V K S - I V E - - - - - - - - -
TTATTAGCTATGGGATTTAAAGAAGTGAAAAGC---ATTGTAGAA---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F E P Q D H P A R E M Q D T F F L K Y P N E G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I P E D L L S K V K E V H E R C W K Y K F D E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V S R R L I L R T H T T A S S I R Y L A S L S D
- - - - - I L R T H T T A S S I - - - - - - - -
---------------ATTTTAAGAACTCATACCACTGCATCATCAATA------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
E E K N K P H K V F C I D R V F R N E A I D Y K
- - - - - - H K V F C I D R V F R N - - - - - -
------------------CACAAGGTATTTTGTATAGATAGAGTATTTAGAAAT------------------
361362363364365366367368369370371372373374375376377378379380381382383384
H L P E F Y Q C E G I I M D D N V N F N N L I G
- - P E F Y Q C E G I I M - - - - - F N N L I G
------CCAGAGTTTTATCAGTGTGAAGGAATTATAATG---------------TTTAACAACCTAATTGGA
385386387388389390391392393394395396397398399400401402403404405406407408
V L K E F L N R L G F E K V R F R P A Y F P F T
V L K E F L N - - - - - - - - - - - - - - - - -
GTTTTAAAAGAATTCTTAAAT---------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E P S L E A E V Y L E G K G W L E I L G A G I F
- - S L E A E V - - - - - - - - E I L G A G I F
------TCCTTAGAGGCAGAGGTT------------------------GAAATCTTAGGAGCAGGAATATTT
433434435436437438439440441442443444445446447448449450451452453454455456
R P E V L E P I G I E K P V L A W G I G F S R L
- - - - - - - - - - - K P V L A W G I G F S R L
---------------------------------AAGCCAGTTTTAGCTTGGGGTATTGGGTTTAGTAGATTA
457458459460461462463464465466467468469470471472473474475476477478479480
A M L R Y G L T D I R D L H K N D L D W L K R V
A M L - - - - - - - - - - - - - - - - - - - - -
GCAATGCTT---------------------------------------------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_pheALPHA_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D P R E L A E R L T E R D L R I L I H L A E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G E A T P E E L A E S L D V D L G P V M R S L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W L E E R G L I E S E E E T H E V Y E L G D E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K E Y A E E G L P E L R I V E V L R K I G G E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R L E E V L D R A G V P R K L A G P V L G W L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
R K G L A E I K R E D G E T S L V L L E E E P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D V D Q S V L E A L A A E G S A S V E E L A R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L E M D E E E V E K A L K R L S E R G D V L R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R E E T V K K V R L T E R G E E V A E H A P E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L E R D W I T E L K P E H L R E G T W K E K E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K P Y D V K A P T S P T F P G K R H P L K E V I
- - - - - - - - - - - - - - - - - - P L K E V I
------------------------------------------------------CCACTGAAGGAGGTTATC
265266267268269270271272273274275276277278279280281282283284285286287288
N E I R R I F L E M G F V E V S G P L V E S S F
N E I R R I F L E M G F V E V S G P L V E - - -
AACGAGATACGTAGGATCTTCCTCGAGATGGGTTTCGTGGAGGTGTCCGGACCGCTGGTCGAG---------
289290291292293294295296297298299300301302303304305306307308309310311312
W N F D A L F Q P Q D H A A R E M Q D T F Y L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E P A E A E L P D E E V V E K V R A V H E D G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D T G S R G W G Y E W D E G V A R K T V L R T H
- - - - - - - - - - - - - - - - - - - V L R T H
---------------------------------------------------------GTCCTTCGTACTCAC
361362363364365366367368369370371372373374375376377378379380381382383384
T T A V S V R K L Y E V E G P P L K A F S I G R
T T A V S V - - - - - - - - - - L K A F S I G R
ACGACGGCGGTGTCGGTT------------------------------CTCAAAGCGTTCTCGATCGGCCGG
385386387388389390391392393394395396397398399400401402403404405406407408
V Y R R E T V D Y K H L P E F H Q C E G I V L A
V Y R R - - - - - - - - P E F H Q C E G I V L -
GTGTACCGGCGC------------------------CCGGAGTTCCATCAGTGTGAGGGAATAGTCCTG---
409410411412413414415416417418419420421422423424425426427428429430431432
K D V S F R D L L G I L E E F Y R R M G F E E V
- - - - F R D L L G I L E E F Y R - - - - - - -
------------TTCCGGGACTTGCTCGGGATACTCGAGGAGTTCTACCGA---------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R F R P A Y F P Y T V L S V E P E V Y F E E K G
- - - - - - - - - - - - S V E P E V - - - - - -
------------------------------------TCCGTCGAACCCGAGGTA------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D W V E L G G A G I F R P E V L Q P L G F D P D
- - - E L G G A G I F - - - - - - - - - - - - -
---------GAGCTAGGCGGTGCGGGCATTTTC---------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
V V C L A W G L G V E R L A M L K L G I D D I R
V V C L A W G L G V E R L A M L - - - - - - - -
GTGGTGTGTTTAGCATGGGGCTTGGGCGTCGAACGACTGGCGATGCTG------------------------
505506507508509510511512513514515516517518519520521522523524
D L Y M S D L K T L L E L P T A R A R R
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_pheALPHA_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M M D L D R I I D Q L H I Y E K K V L K A F E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S D K P L K P E E I A E S Q K I D I K S V M S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S G A L E S R G F V R V M K D A D E V V S L T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D G E S C A R E G L P E R R L I E A L K G E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E M S E L S R R A G L D K K E A G I G I G W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
M R K G W G R I S Q G M V S A V S D E T P E R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A D E R L L E L L L E R G S V R I R E L P D E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R G A L K D L K G R K G I V D I R K I K R H T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L T T E G R K L L E R G I E I V E E A T Q V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H E H L K S G A W R K L H Y R G Y N I D A E Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L V Y P G K M H P L R R I I D E I R S I F L K L
- - - - - - - - P L R R I I D E I R S I F L K L
------------------------AAGTTTAAGGAATATTGACCTTATCTCATCGATTATGCGCCTCAGAGG
265266267268269270271272273274275276277278279280281282283284285286287288
G F T E S R G P I V E S A F W N F D C L F Q P Q
G F T E S R G P I V E - - - - - - - - - - - - -
GTGCATCTTTCCAGGGTAGACCAGAGGGTACTC---------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D H A A R E M Q D T F Y V K N P A V T D L P C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D L V R A V Q D A H E T G G S T G S E G W Q Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W D R D V A R Q S V L R T H T T C V S A R F L S
- - - - - - - - - V L R T H T T C V S A - - - -
---------------------------TTCATCAGGGAGTTCTCTGATCCTCACGGATCC------------
361362363364365366367368369370371372373374375376377378379380381382383384
E N E P P L K M F S V G R V F R R E T I T Y K H
- - - - - L K M F S V G R V F R R - - - - - - -
---------------CTCATCCGCACCCCTTTCAGGTGTTTCATCGCTCAC---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L P E F H Q V E G I V A G D E V N F R N L L G I
- P E F H Q V E G I V A - - - - - F R N L L G I
---CCTCCCCCATCCCTTCCTCATGAGCCAGCCAAT---------------TTTCTTATCAAGACCCGCTCT
409410411412413414415416417418419420421422423424425426427428429430431432
L R E F Y R K L G F E V R F R P A Y F P Y T Y L
L R E F Y R - - - - - - - - - - - - - - - - - -
CCTGGAAAGTTCTGACAT------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S T E C E I Y L P E K K S W I E L G G A G M F R
S T E C E I - - - - - - - - - E L G G A G M F -
CTCCCTGGCACAGGACTC---------------------------ATCCGCGTCCTTCATAACCCTCAC---
457458459460461462463464465466467468469470471472473474475476477478479480
P E V L E P L G V E T P V A A F G L G I E R L A
- - - - - - - - - - T P V A A F G L G I E R L A
------------------------------CATGACAGATTTTATATCAATTTTCTGGGATTCTGCTATTTC
481482483484485486487488489490491492493494495496497498499500501502503504
M I R F D I K D I R M L Y Q S D L G W L R G L P
M I - - - - - - - - - - - - - - - - - - - - - -
TTCAGG------------------------------------------------------------------
505506507508509510511
V T G D L E L
- - - - - - -
---------------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_pheALPHA_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T D Q P S N L V T Q L E T L R Q E A Q T A I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A A D C L E R L E E L R V A Y L G K K G Q L S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I M R Q M G Q L S A E E R P Q F G S I A N T V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A V Q A N L D D R R T K L Q A A R L Q A K L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E T I D V T M P G V F R P L G H A H P L N S T
- - - - - - - - - - - - - - - - - - - P L N S T
---------------------------------------------------------TTCTATCTGATGGAA
121122123124125126127128129130131132133134135136137138139140141142143144
T D R I I D I F V G L G Y T V A T G P E I E S D
T D R I I D I F V G L G Y T V A T G P E I E - -
AACTGCGGCATGGGTAGCATCTACAGTATCTCGCCGATAGCAGCGACCTGGAACCACAATTCGCAC------
145146147148149150151152153154155156157158159160161162163164165166167168
Y Y N F E A L N F L P D H P A R D M Q D T L Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P D G N L L R T H T S N G Q I H Y M E D N E P P
- - - - L L R T H T S N G Q I - - - - - - - - -
------------CATATCCCGTGCTGGATGGTCGGGTAAGAAATT---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V R I V V P G R C Y R R D T V D A T H A A V F H
V R I V V P G R C Y R R - - - - - - - - A V F H
TTCGATTTCCGGTCCCGTCGCTACGGTGTAACCCAG------------------------GTCAGTAGTACT
217218219220221222223224225226227228229230231232233234235236237238239240
Q I E F F A V D E G I T F T D L K G T I Q I F L
Q I E F F A V - - - - - F T D L K G T I Q I F L
GTTGAGGGGATGGGCGTGACC---------------CCCAGGCATAGTCACATCTATAGTTTCAGATTCTAA
241242243244245246247248249250251252253254255256257258259260261262263264
Q E M F G D V P I R F R A S Y F P F T E P S A E
Q - - - - - - - - - - - - - - - - - - - - S A E
TTT------------------------------------------------------------TTCTTTAAC
265266267268269270271272273274275276277278279280281282283284285286287288
V D V Q W K G R W L E V M G C G A I D P N V L K
V D V - - - - - - - E V M G C G A I - - - - - -
GGTGTTGGC---------------------TTCTTCAGCTGAGAGCTGACCCAT------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A V G Y D P E V Y T G F A A G M G V E R L A M V
- - - - - - - - Y T G F A A G M G V E R L A M V
------------------------TGCTACTCTGAGTTCCTCCAATCGCTCCAGGCAATCGGCAGCAGCGAT
313314315316317318319320321322323324325326327328329330331332333
L H Q I D D I R R F Y S S D L R F L R Q F
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_pheALPHA_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L Q Q L D L I Q H E I E Q Y H P T T L Q E L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E F R I K F L S K K G T I T Q L F T E F G Q L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P A D K Q A L G S K L N A L K Q I A Q E K Y K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y A S Q L Q S T P K Q N T D V N E D Y T L P P P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A D K L G S R H P I S I L K D R I L E I F E K I
- - - - - - - - P I S I L K D R I L E I F E K I
------------------------ATCTTCTCCAAATAAGCTACGTAAAAAATATAAAAGCACTTGTTTAAG
121122123124125126127128129130131132133134135136137138139140141142143144
G F S I V E G P E I E D D W H N F G A L N F S P
G F S I V E G P E I E - - - - - - - - - - - - -
TTCTACAAAGCTTACATTCTTATTAACATAGAA---------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N H P A R D M L D T F F I S Q C P D I L L R T H
- - - - - - - - - - - - - - - - - - - L L R T H
---------------------------------------------------------ACTCTCAGCCACCCG
169170171172173174175176177178179180181182183184185186187188189190191192
T S S V Q I R V A E S Q A P P I R A I S I G R V
T S S V Q I - - - - - - - - - I R A I S I G R V
TATCTGCACAGAAGAGGT---------------------------CTGAGAAATGAAAAAAGTATCTAACAT
193194195196197198199200201202203204205206207208209210211212213214215216
Y R N E T I S A R S H C M F H Q V D A F Y V N K
Y R N - - - - - - - - C M F H Q V D A F Y V - -
ATCCCTGGC------------------------CGCTCCGAAATTATGCCAATCATCTTCTATTTC------
217218219220221222223224225226227228229230231232233234235236237238239240
N V S F V E L K Q V L L Y F L R S L F G E D I K
- - - F V E L K Q V L L Y F L R - - - - - - - -
---------ACTAAATCCAATTTTTTCAAATATTTCTAAAATTCTATC------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
M R I R P S Y F P F T E P S V E I D I N C R I C
- - - - - - - - - - - - - S V E I D I - - - - -
---------------------------------------CTCATTTACATCTGTATT---------------
265266267268269270271272273274275276277278279280281282283284285286287288
N G N G C N I C K H S G W L E I M G A G M I D P
- - - - - - - - - - - - - - E I M G A G M I - -
------------------------------------------TTGTTTTAATGCATTTAGCTTACT------
289290291292293294295296297298299300301302303304305306307308309310311312
N V L K N C H I D P T T Y T G Y A F G M G L E R
- - - - - - - - - - - - Y T G Y A F G M G L E R
------------------------------------AGTAAAAAGCTGAGTAATAGTTCCCTTCTTACTTAG
313314315316317318319320321322323324325326327328329330331332333334335336
I A M L M Y Q I N D L R L F T E N D V R F L K Q
I A M L - - - - - - - - - - - - - - - - - - - -
AAATTTTATGCG------------------------------------------------------------
337338339340341
F K A Y A
- - - - -
---------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_pheALPHA_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q D T A I Q E I Q G A E T L E A L Q A V K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y V G K S G L V T K E L G S L G K L P P E E R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A C G A E I N V V R A A I Q A A L D E K E S A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K R A A L D A K L A S E A I D V T L P G L P L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A G G L H P I S R V L D D L I G I Y R Q M G Y A
- - - - - P I S R V L D D L I G I Y R Q M G Y A
---------------CCCATTTCCCGCGTGCTCGACGACCTGATCGGCATCTACCGCCAGATGGGCTACGCG
121122123124125126127128129130131132133134135136137138139140141142143144
V I E G P E V E E E H Y N F E A L N V P W Y H P
V I E G P E V E - - - - - - - - - - - - - - - -
GTGATCGAGGGGCCGGAAGTCGAG------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A R D L Q D T F W L E D G R L L R T H T S P M Q
- - - - - - - - - - - - - - L L R T H T S P M Q
------------------------------------------CTGCTGCGCACCCACACCTCGCCCATGCAG
169170171172173174175176177178179180181182183184185186187188189190191192
I R Y M V D H E P P F K I V V R G K V Y R Y E A
I - - - - - - - - - F K I V V R G K V Y R Y - -
ATT---------------------------TTCAAGATCGTGGTGCGCGGCAAGGTCTACCGCTAC------
193194195196197198199200201202203204205206207208209210211212213214215216
T D A T H E A M F H Q L E G L V V G D G I S M S
- - - - - - A M F H Q L E G L V V - - - - - M S
------------------GCGATGTTTCACCAACTGGAAGGGCTGGTGGTG---------------ATGAGC
217218219220221222223224225226227228229230231232233234235236237238239240
D L K G T I A E M A R G L Y G A S A K A R F Q P
D L K G T I A E M A R - - - - - - - - - - - - -
GACCTCAAGGGGACCATTGCCGAAATGGCGCGC---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S Y Y P F V E P G A D F A V Y W E N P R G E S K
- - - - - - - - G A D F A V - - - - - - - - - -
------------------------GGCGCCGACTTCGCCGTG------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W L E L G G C G M V H P N V F K A V D D L R E A
- - E L G G C G M V - - - - - - - - - - - - - -
------GAACTGGGCGGCTGCGGCATGGTG------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A G K D R V Y E G K T G F A F G L G L E R I A M
- - - - - - - - - K T G F A F G L G L E R I A M
---------------------------AAAACCGGCTTCGCGTTCGGGCTGGGGCTGGAGCGCATCGCCATG
313314315316317318319320321322323324325326327328329330331332333334335336
L K Y G I P D I R Y F Y A N D P R V I G Q F R G
L - - - - - - - - - - - - - - - - - - - - - - -
CTG---------------------------------------------------------------------
337338339
E L G
- - -
---------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_pheALPHA_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A D A T P L D D L K Q L E E Q A L T Q L Q Q C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A D E T A L R A W N T Q Y F G D K G V M K T A M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S N L G K I P K D Q K P A Y G A E L N R I K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I T T A Y E A A L A E A K E K A L Q V S L T T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P L D V T L P G R A P A R G R L H P A T Q I L R
- - - - - - - - - - - - - - - - - P A T Q I L R
---------------------------------------------------GCCCTTCAGGTCGGCCATCGT
121122123124125126127128129130131132133134135136137138139140141142143144
Q I Y S I F A D L G F Q V Y R T R E V E T D E L
Q I Y S I F A D L G F Q V Y R T R E V E - - - -
CACGCCCTCGCCGACCACCAAGCCCTCCACCTGGTAGAACTGGATCTCGCTCCGGGTGCT------------
145146147148149150151152153154155156157158159160161162163164165166167168
N F E F L N M P A H H P A R D M W D T F F T T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P G V V L R T H T S P G Q I H V M R E A A G K P
- - - V L R T H T S P G Q I - - - - - - - - - -
---------GTGCGTGCGAAGCACGACGCCCGGCGTGGTGGT------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V R V I L P G M C Y R N E A I S T R S E I Q F Y
V R V I L P G M C Y R N - - - - - - - - I Q F Y
GTGGTGCGCGGGCATGTTCAGGAACTCGAAGTTCAG------------------------GCGGTACACCTG
217218219220221222223224225226227228229230231232233234235236237238239240
Q V E G L V V G E G V T M A D L K G T I T A F A
Q V E G L V V - - - - - M A D L K G T I T A F A
GAACCCGAGGTCGGCGAAGAT---------------GAGGATTTGGGTCGCGGGGTGCAACCGCCCCCGTGC
241242243244245246247248249250251252253254255256257258259260261262263264
R R M F G P E R Q V R I R S S Y F P F T E P S I
R - - - - - - - - - - - - - - - - - - - - - S I
CGG---------------------------------------------------------------TTTCGC
265266267268269270271272273274275276277278279280281282283284285286287288
E V D I D W P K D D P N R D R L T K G T G W L E
E V D I - - - - - - - - - - - - - - - - - - - E
CTCCGCGAGGGC---------------------------------------------------------CGG
289290291292293294295296297298299300301302303304305306307308309310311312
I L G A G M V H P N V L R A G G Y D P E K V T G
I L G A G M V - - - - - - - - - - - - - - V T G
TTTTTGGTCCTTCGGGATCTT------------------------------------------AAAATACTG
313314315316317318319320321322323324325326327328329330331332333334335336
F A F G M G P Q R M L M L K H A I D D I R L F W
F A F G M G P Q R M L M L - - - - - - - - - - -
CGTGTTCCAGGCGCGGAGCGCGGTTTCGTCCGCGCATTG---------------------------------
337338339340341342343344345346
Q N D L R F L K Q F
- - - - - - - - - -
------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_pheALPHA_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M F E Q L D Q I E K E A A A A L A S V Q S L D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A A W R T Q W T G K K G A L A Q A S Q S I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L D P K D R P A F G Q R F G A I K Q A L S E Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T T L E A R L Q S A A L H Q E L E E D A V D I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P G R A A N I G R L H P S T Q S L R R I Q H I
- - - - - - - - - - - - P S T Q S L R R I Q H I
------------------------------------CCCAGCACTCAATCGCTGCGCCGAATTCAGCATATT
121122123124125126127128129130131132133134135136137138139140141142143144
F A E M G F Q V W E S R E V E S D E Y N F E L L
F A E M G F Q V W E S R E V E - - - - - - - - -
TTTGCTGAAATGGGCTTTCAAGTCTGGGAAAGCCGCGAAGTCGAA---------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N M P A H H P A R D M W D T F Y V Q S D D P H Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K V V L R T H T S P G Q I H V M R T L N P E P I
- - V L R T H T S P G Q I - - - - - - - - - - I
------GTGTTGCGCACCCACACCTCGCCTGGCCAAATT------------------------------ATT
193194195196197198199200201202203204205206207208209210211212213214215216
R V I L P G K C Y R Y E P V S A R S E M M F H Q
R V I L P G K C Y R Y - - - - - - - - M M F H Q
CGGGTGATTTTGCCTGGTAAGTGCTATCGCTAC------------------------ATGATGTTCCATCAA
217218219220221222223224225226227228229230231232233234235236237238239240
V E G L V I G K N I T M A D L K G T L A N F A R
V E G L V I - - - - - M A D L K G T L A N F A R
GTTGAAGGCTTGGTGATC---------------ATGGCCGACCTCAAAGGTACCTTGGCCAACTTTGCGCGG
241242243244245246247248249250251252253254255256257258259260261262263264
R M F K D D V K V R Y R P S Y F P F T E P S V E
- - - - - - - - - - - - - - - - - - - - - S V E
---------------------------------------------------------------AGCGTCGAA
265266267268269270271272273274275276277278279280281282283284285286287288
V D I E C F I C G G E G C R I C K K S G W L E I
V D I - - - - - - - - - - - - - - - - - - - E I
GTCGATATC---------------------------------------------------------GAAATT
289290291292293294295296297298299300301302303304305306307308309310311312
L G A G M V H P T V L R N G G Y D P A E W S G F
L G A G M V - - - - - - - - - - - - - - W S G F
CTGGGCGCAGGGATGGTG------------------------------------------TGGAGCGGCTTT
313314315316317318319320321322323324325326327328329330331332333334335336
A F G M G P E R Q T M L R Y D I D D I R W F F S
A F G M G P E R Q T M L - - - - - - - - - - - -
GCCTTTGGGATGGGGCCAGAACGCCAAACCATGCTG------------------------------------
337338339340341342343344345346
N D G R F L E Q F G
- - - - - - - - - -
------------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_pheALPHA_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K K N L T N L R I E T L E D L K I A K S N F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N N D L E L K Q L M N D L K L A S K E Q K A S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G Q K I N F Y K Q E I E Q F F L T K K E E I E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K E V L K K I Q D E F I D V F E E V N F S S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H P L T L I E N R F R T W F L N N G Y Y E T E G
- P L T L I E N R F R T W F L N N G Y Y E T E G
---TTCTTCAAAAACATAACTAAGTAAAGATTTTAATAATCACATTAAATTTGGAAAATTATACTTTCCTGC
121122123124125126127128129130131132133134135136137138139140141142143144
S E I T T D K I N F E L L N I P K D H P S R D M
S E I T - - - - - - - - - - - - - - - - - - - -
AACAATTACATC------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q D S L Y L E K E Q N G D Q L L L R T H N T G F
- - - - - - - - - - - - - - - L L R T H N T G F
---------------------------------------------AATAATACTAAAACCTGTATTATGAGT
169170171172173174175176177178179180181182183184185186187188189190191192
S I I E L I K N K N K A F S A F S I G K V Y R N
S I - - - - - - - - - - F S A F S I G K V Y R N
TCTTAA------------------------------TAAATATAAAGAATCTTGCATATCTCTTGAAGGATG
193194195196197198199200201202203204205206207208209210211212213214215216
D E D D N T H S H Q F S Q V D V I V A G K Y N F
- - - - - - - - H Q F S Q V D V I V A - - - - F
------------------------AAAATTAATTTTATCAGTTGTGATTTCGCTTCC------------ATA
217218219220221222223224225226227228229230231232233234235236237238239240
P N L M W L L K S L L S Y V F E E E V K I R L R
P N L M W L L K S L L S - - - - - - - - - - - -
ACCATTATTTAAAAACCAAGTTCTAAAACGATTTTC------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P S Y F P F T E P S C E V D V F Y K N K W I E V
- - - - - - - - - S C E V D V - - - - - - - E V
---------------------------ATCTTGAATTTTTTTAAG---------------------TTCTTT
265266267268269270271272273274275276277278279280281282283284285286287288
L G S G I I H E N V M K A A G Y T N D M N A L A
L G S G I I - - - - - - - - - - - - - M N A L A
TTTTGTTAAAAAAAATTG---------------------------------------TGATGCTTTTTGTTC
289290291292293294295296297298299300301302303304305306307308309310311312
W G I G I E R I A M I K Y G I D N I R E F Y K N
W G I G I E R I A M I - - - - - - - - - - - - -
TTTAGAAGCAAGTTTTAAATCATTCATCAACTG---------------------------------------
313314315316317318319320321322323324325326327328329
D I R F L K Q F N L E I E K L E V
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Phycisphaera mikurensis/amino acid sequences/Pmikurensis_pheALPHA_aa
Bacteria/Phycisphaera mikurensis/nucleotide sequences/Pmikurensis_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E T V E R V V E R A E A D L A G V A D A A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L E R F R A A W L G P K G E M K K L L G G I G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V P A A D R R A F G Q A A N A A R Q K L Q E A F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A R R E A L G G S V K T K R S G P P L D L T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P P I L P E T G R R H V I S Q T V D E L L E V F
- - - - - - - - - - - V I S Q T V D E L L E V F
---------------------------------GAGGTCGACCATCGTCACGCCCCGGTCGACGCAGAGCCC
121122123124125126127128129130131132133134135136137138139140141142143144
G R M G F D V A E G P E L E D D R H N F V A L N
G R M G F D V A E G P E L E - - - - - - - - - -
CTCGATCTGGTGGAACATCGAGGTGTGCGTCGCGTCGTGCTC------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I P E S H P A R D P L D N F Y V A E E G V A P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F S T S L M R S Q T S T V Q I R V L E H T K P P
- - - - L M R S Q T S T V Q I - - - - - - - - -
------------GGGCGCGACGCCCTCCTCCGCAACGTAGAAGTT---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V R I V S T G R V Y R P D E H D A T H T S M F H
V R I V S T G R V Y R P - - - - - - - - S M F H
CTCGGGGATGTTGAGCGCGACGAAGTTGTGCCGGTC------------------------GACGTCGAAGCC
217218219220221222223224225226227228229230231232233234235236237238239240
Q I E G L C V D R G V T M V D L K T T L I Q F A
Q I E G L C V - - - - - M V D L K T T L I Q F A
CATGCGACCGAAAACCTCGAG---------------CTGCGAGATGACGTGCCGGCGGCCGGTCTCCGGGAG
241242243244245246247248249250251252253254255256257258259260261262263264
K A V F G A D A E V K L V P S Y F P F T E P S A
K - - - - - - - - - - - - - - - - - - - - - S A
GAT---------------------------------------------------------------CTCCCG
265266267268269270271272273274275276277278279280281282283284285286287288
E L Y V K M D F G K G P E W M E I G G C G M V D
E L Y V - - - - - - - - - - - E I G G C G M V -
TCTCGCCTCGAA---------------------------------GGCCTGCCCGAAGGCCCGGCGGTC---
289290291292293294295296297298299300301302303304305306307308309310311312
P A V L G H V D V D P E E W T G F A F G L G I E
- - - - - - - - - - - - - W T G F A F G L G I E
---------------------------------------CTCGCCCTTGGGGCCGAGCCACGCGGCGCGGAA
313314315316317318319320321322323324325326327328329330331332333334335336
R L V M R K H D I A D I R W L Y E N D R R F L R
R L V M R - - - - - - - - - - - - - - - - - - -
CCGCTCCAGGCCCGC---------------------------------------------------------
337338
R F
- -
------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_pheALPHA_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E Q Q T M S E L K Q Q A L V D I N E A N D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R A L Q E V K V K Y L G K K G S V S G L M K L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K D L P N E E K P A F G Q K V N E L R Q T I Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L D E R Q Q M L V K E K L N K Q L A E E T I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V S L P G R H I E I G S K H P L T R T I E E I E
- - - - - - - - - - - - - - P L T R T I E E I E
------------------------------------------CCATTAACACGTACAATAGAAGAAATTGAA
121122123124125126127128129130131132133134135136137138139140141142143144
D L F L G L G Y E I V N G Y E V E Q D H Y N F E
D L F L G L G Y E I V N G Y E V E - - - - - - -
GACTTATTCTTAGGTTTAGGTTATGAAATTGTCAATGGATATGAAGTTGAA---------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M L N L P K S H P A R D M Q D S F Y I T D E I L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------TTA
169170171172173174175176177178179180181182183184185186187188189190191192
L R T H T S P V Q A R T M E S R H G Q G P V K I
L R T H T S P V Q A - - - - - - - - - - - V K I
TTACGTACGCATACATCACCAGTGCAAGCA---------------------------------GTTAAAATT
193194195196197198199200201202203204205206207208209210211212213214215216
I C P G K V Y R R D S D D A T H S H Q F T Q I E
I C P G K V Y R R - - - - - - - - H Q F T Q I E
ATTTGCCCTGGTAAAGTGTATCGTCGT------------------------CATCAATTTACACAAATTGAA
217218219220221222223224225226227228229230231232233234235236237238239240
G L V V D K N V K M S D L K G T L E L L A K K L
G L V V - - - - - M S D L K G T L E L L A K - -
GGATTAGTTGTT---------------ATGAGTGATTTGAAAGGTACTTTAGAATTGTTAGCTAAG------
241242243244245246247248249250251252253254255256257258259260261262263264
F G A D R E I R L R P S Y F P F T E P S V E V D
- - - - - - - - - - - - - - - - - - - S V E V D
---------------------------------------------------------TCTGTAGAAGTTGAT
265266267268269270271272273274275276277278279280281282283284285286287288
V S C F K C K G K G C N V C K H T G W I E I L G
V - - - - - - - - - - - - - - - - - - - E I L G
GTG---------------------------------------------------------GAAATTTTAGGC
289290291292293294295296297298299300301302303304305306307308309310311312
A G M V H P N V L E M A G F D S S E Y S G F A F
A G M V - - - - - - - - - - - - - - Y S G F A F
GCTGGAATGGTA------------------------------------------TACTCTGGATTTGCATTT
313314315316317318319320321322323324325326327328329330331332333334335336
G M G P D R I A M L K Y G I E D I R H F Y T N D
G M G P D R I A M L - - - - - - - - - - - - - -
GGTATGGGACCAGACCGTATTGCAATGTTG------------------------------------------
337338339340341342343344345346347348349350351352
V R F L D Q F K A V E D R G D M
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Mycobacterium smegmatis/amino acid sequences/Msmegmatis_pheALPHA_aa
Bacteria/Mycobacterium smegmatis/nucleotide sequences/Msmegmatis_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V R T Q G G E T A G E Q P S D L S E E A L T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A V S A A R H A F D A A G D L D A L A R A K T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H L G D R A P I A L A R Q A L A S L P K A D R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D A G K R V N V A R A E A Q R A Y D E R L A V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A E R D A A V L V A E R I D V T L P S T R Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L G A R H P I T I L A E N I A D T F V A M G W E
- - - - - P I T I L A E N I A D T F V A M G W E
---------------CTCGACCTGATGGAACACCGGGGTGTGGGTGGAGTCGAGTTCGTCGGTGCGGAACGT
145146147148149150151152153154155156157158159160161162163164165166167168
L A E G P E V E T E Q F N F D A L N F P P D H P
L A E G P E V E - - - - - - - - - - - - - - - -
GCGGCCGATCGAGATGATGTACAC------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A R S E Q D T F Q I A P D G S R Q V L R T H T S
- - - - - - - - - - - - - - - - - V L R T H T S
---------------------------------------------------CTCGCTGCGCGCGGGGTGGTC
193194195196197198199200201202203204205206207208209210211212213214215216
P V Q I R A L L E R D L P V Y I I S I G R T F R
P V Q I - - - - - - - - - V Y I I S I G R T F R
CGGCGGGAAGTT---------------------------CTCGACCTCGGGGCCCTCGGCCAGTTCCCAGCC
217218219220221222223224225226227228229230231232233234235236237238239240
T D E L D S T H T P V F H Q V E G L A V D K G L
T - - - - - - - - P V F H Q V E G L A V - - - -
CAT------------------------CTCGGCCAGGATCGTGATGGGGTGCCGCGCACC------------
241242243244245246247248249250251252253254255256257258259260261262263264
T M A H L R G T L D A F A R A Q F G P E G R T R
- M A H L R G T L D A F A R - - - - - - - - - -
---CGACGGCAGCGTCACGTCGATGCGCTCGGCGACCAGCAC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F R P H F F P F T E P S A E V D I W F P G K K G
- - - - - - - - - - - S A E V D I - - - - - - -
---------------------------------GCGGGCGACGTTGACACG---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G P G W V E W G G C G M V N P N V L R A C G I D
- - - - - E W G G C G M V - - - - - - - - - - -
---------------GGCCAGCGCCTGGCGAGCCAGCGC---------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P E V Y S G F A F G M G L E R T L Q F R N G I P
- - - Y S G F A F G M G L E R T L Q F - - - - -
---------AAGCGCATCGAGGTCTCCGGCCGCGTCGAACGCATGCCGCGCCGCGCT---------------
337338339340341342343344345346347348349350351352353354355356
D M R D M V E G D V R F S L P F G V G A
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Bacteria/Escherichia coli/amino acid sequences/Ecoli_pheALPHA_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R K N M S H L A E L V A S A K A A I S Q A S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V A A L D N V R V E Y L G K K G H L T L Q M T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L R E L P P E E R P A A G A V I N E A K E Q V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A L N A R K A E L E S A A L N A R L A A E T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D V S L P G R R I E N G G L H P V T R T I D R I
- - - - - - - - - - - - - - - P V T R T I D R I
---------------------------------------------GTTGGTATCAACAATCAGACCTTCCAT
121122123124125126127128129130131132133134135136137138139140141142143144
E S F F G E L G F T V A T G P E I E D D Y H N F
E S F F G E L G F T V A T G P E I E - - - - - -
CTGATGGAACATCGGCGTGTGAGTCTGGTCGTAGTCGTTACGATAAACGCGGCC------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D A L N I P G H H P A R A D H D T F W F D A T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L R T Q T S G V Q I R T M K A Q Q P P I R I I
L L R T Q T S G V Q I - - - - - - - - - I R I I
AAACCAGAAAGTGTCGTGGTCAGCGCGCGCCGG---------------------------GAAGTTATGATA
193194195196197198199200201202203204205206207208209210211212213214215216
A P G R V Y R N D Y D Q T H T P M F H Q M E G L
A P G R V Y R N - - - - - - - P M F H Q M E G L
ATCGTCTTCGATTTCCGGCCCGGT---------------------ACCGAAGAAACTTTCGATACGGTCGAT
217218219220221222223224225226227228229230231232233234235236237238239240
I V D T N I S F T N L K G T L H D F L R N F F E
I V - - - - - F T N L K G T L H D F L R - - - -
GGTACG---------------CCCGCCGTTTTCAATGCGACGACCCGGCAGGGAGACATC------------
241242243244245246247248249250251252253254255256257258259260261262263264
E D L Q I R F R P S Y F P F T E P S A E V D V M
- - - - - - - - - - - - - - - - - S A E V D V -
---------------------------------------------------CAGCGCCTGCTGAACCTG---
265266267268269270271272273274275276277278279280281282283284285286287288
G K N G K W L E V L G C G M V H P N V L R N V G
- - - - - - - E V L G C G M V - - - - - - - - -
---------------------ACCAGCTGCCGGACGCTCTTCTGG---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I D P E V Y S G F A F G M G M E R L T M L R Y G
- - - - - Y S G F A F G M G M E R L T M L - - -
---------------TTTTTTACCCAAATATTCGACGCGCACATTATCTAACGCGGCAACATC---------
313314315316317318319320321322323324325326327328329330331
V T D L R S F F E N D L R F L K Q F K
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_pheALPHA_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K L D K I L E E L K L L L S S V S S L K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q E V R S K F L G S K G V I K E L L K K I K E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P S E E R K E Y G K R V N L L K E E A E K L I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E K E E E L K E R E L E E K L K G E W V D L S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P P A R T V G S L H P I T V T L E R I V T I F R
- - - - - - - - - - P I T V T L E R I V T I F R
------------------------------CCCATAACAGTTACGCTCGAGAGGATTGTGACGATATTCAGA
121122123124125126127128129130131132133134135136137138139140141142143144
G M G F E V E E G P E V E R E E Y N F D M L N I
G M G F E V E E G P E V E - - - - - - - - - - -
GGAATGGGATTTGAGGTTGAGGAAGGTCCCGAGGTAGAG---------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P K E H P A R D M Q D T F Y V N R E G Y L L R T
- - - - - - - - - - - - - - - - - - - - L L R T
------------------------------------------------------------CTTCTGAGGACT
169170171172173174175176177178179180181182183184185186187188189190191192
H T S P V Q I R T M L K K K P P I Q I I A P G K
H T S P V Q I - - - - - - - - - I Q I I A P G K
CACACCTCTCCCGTCCAGATA---------------------------ATCCAGATAATAGCCCCCGGGAAG
193194195196197198199200201202203204205206207208209210211212213214215216
V Y R R D D D P T H S P M F H Q V E G L V V N E
V Y R R - - - - - - - P M F H Q V E G L V V - -
GTTTACAGGAGG---------------------CCTATGTTCCATCAGGTTGAAGGGCTTGTTGTA------
217218219220221222223224225226227228229230231232233234235236237238239240
Y A N F R H M K Y V I E E F L K K F F E T D L P
- - - F R H M K Y V I E E F L K - - - - - - - -
---------TTCAGACACATGAAGTACGTAATTGAGGAATTCCTGAAG------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V R F R T S Y F P F T E P S A E V D I G C V I C
- - - - - - - - - - - - - S A E V D I - - - - -
---------------------------------------TCCGCGGAAGTTGACATA---------------
265266267268269270271272273274275276277278279280281282283284285286287288
H Q E G C R V C K H T G W L E V M G C G M V H P
- - - - - - - - - - - - - - E V M G C G M V - -
------------------------------------------GAAGTAATGGGTTGCGGAATGGTT------
289290291292293294295296297298299300301302303304305306307308309310311312
K V L E N C G I D T D F Y Q G F A F G M G V E R
- - - - - - - - - - - - Y Q G F A F G M G V E R
------------------------------------TACCAGGGATTTGCCTTCGGAATGGGTGTTGAGAGA
313314315316317318319320321322323324325326327328329330331332333334335336
L A M L L F G I D N I K L F Y E N D L R F I K Q
L A M L - - - - - - - - - - - - - - - - - - - -
CTCGCGATGCTC------------------------------------------------------------
337338
F F
- -
------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_pheALPHA_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q E E L K R L E K E A V E K V E A A G S L K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V N D V R V A Y L G K K G P I T E V L R G M G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L S A E E R P K M G A L A N E V R E K I A A A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E K N A R L E E E E V K R K L K E Q T I D V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L P G S P V K T G A R H P L T I V I E E I E D L
- - - - - - - - - - - - P L T I V I E E I E D L
------------------------------------CTTTTTCGCGACCGTTTCCAGGGTTCCTTTTAAGTC
121122123124125126127128129130131132133134135136137138139140141142143144
F I S M G Y S V E E G P E V E T D Y Y N F E A L
F I S M G Y S V E E G P E V E - - - - - - - - -
GCTCATGCTGATATCACGGTCAACGCAGAGCCCTTCAATCTGCAT---------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N L P K E H P A R D M Q D S F Y I T E D T L M R
- - - - - - - - - - - - - - - - - - - - - L M R
---------------------------------------------------------------TTCCATCGT
169170171172173174175176177178179180181182183184185186187188189190191192
T Q T S P V Q T R T M E K H K G K G P V K I I C
T Q T S P V Q T - - - - - - - - - - - V K I I C
GCGCGTCTGAACAGGAGATGTCTG---------------------------------GCTGTCTTGCATATC
193194195196197198199200201202203204205206207208209210211212213214215216
P G K V Y R R D N D D A T H S H Q F M Q I E G L
P G K V Y R R - - - - - - - - H Q F M Q I E G L
CCGGGCCGGGTGCTCTTTCGG------------------------ATAGTCGGTTTCCACTTCAGGCCCCTC
217218219220221222223224225226227228229230231232233234235236237238239240
C V D R D I S M S D L K G T L E T V A K K M F G
C V - - - - - M S D L K G T L E T V A K - - - -
TTCCAC---------------GATAAACAAGTCTTCGATTTCTTCAATAACGATCGTCAG------------
241242243244245246247248249250251252253254255256257258259260261262263264
E E R E I R L R P S F F P F T E P S V E V D V S
- - - - - - - - - - - - - - - - - S V E V D V -
---------------------------------------------------CAGCTTCCTTTTCACCTC---
265266267268269270271272273274275276277278279280281282283284285286287288
C F K C G G K G C S V C K Q T G W I E I L G A G
- - - - - - - - - - - - - - - - - - E I L G A G
------------------------------------------------------TTCGTTCGCCAAGGCCCC
289290291292293294295296297298299300301302303304305306307308309310311312
M V H P N V L E M A G F D S K Q Y Q G F A F G M
M V - - - - - - - - - - - - - - Y Q G F A F G M
CATTTT------------------------------------------TTCTGTGATCGGTCCCTTTTTTCC
313314315316317318319320321322323324325326327328329330331332333334335336
G V E R I A M L K Y G I D D I R H F Y T N D V R
G V E R I A M L - - - - - - - - - - - - - - - -
CAGATACGCAACGCGGACATCGTT------------------------------------------------
337338339340341342343344
F L S Q F K Q A
- - - - - - - -
------------------------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_pheALPHA_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D L D Q I V A D A Q Q S F E G A A D I T T L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N E K A R F L G K S G A L T E L L K G L G K L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P E A R K T E G A R I N V A K Q Q V E A A L N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R R Q A L A D A L L N Q R L A A E A I D V T L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G R G A G A G S L H P V M R T W E R V E Q I F R
- - - - - - - - - - P V M R T W E R V E Q I F R
------------------------------ATAGACGCCCTTCAGATCCGCGAAGCTGACGTTCTCGTCGAT
121122123124125126127128129130131132133134135136137138139140141142143144
S I G F D V A D G P E I E T D W Y N F T A L N S
S I G F D V A D G P E I E - - - - - - - - - - -
CCACAGGCCTTCGACCTGATTGAACATCGGGGAGTGCGT---------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P E N H P A R S M Q D T F Y V D G K D A D G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L L R T H T S P M Q V R Y A R M N R P P I K V
- L L R T H T S P M Q V - - - - - - - - - I K V
---CAGCCGACGACCGTCCGCGTCCTTGCCGTCGAC---------------------------CGGATGGTT
193194195196197198199200201202203204205206207208209210211212213214215216
I A P G R T Y R V D S D A T H S P M F N Q V E G
I A P G R T Y R V - - - - - - - P M F N Q V E G
CTCCGGGCTGTTCAATGCGGTGAAGTT---------------------GGGGCCGTCGGCCACGTCGAAACC
217218219220221222223224225226227228229230231232233234235236237238239240
L W I D E N V S F A D L K G V Y T D F L K K F F
L W I - - - - - F A D L K G V Y T D F L K - - -
GATCGAGCG---------------GCGCTCCCACGTGCGCATCACCGGATGGAGGCTCCCCGC---------
241242243244245246247248249250251252253254255256257258259260261262263264
E R D D I L V R F R P S Y F P F T E P S A E I D
- - - - - - - - - - - - - - - - - - - S A E I D
---------------------------------------------------------GTCGGCGAGCGCCTG
265266267268269270271272273274275276277278279280281282283284285286287288
M M F E H G K N A G K W L E I S G S G Q V H P T
M - - - - - - - - - - - - E I S G S G Q V - - -
GCG------------------------------------GACATTGATGCGCGCGCCTTCCGT---------
289290291292293294295296297298299300301302303304305306307308309310311312
V I R N M G L D P E R Y I G F A F G S G L E R L
- - - - - - - - - - - Y I G F A F G S G L E R L
---------------------------------CTCGGTCAGCGCGCCCGACTTACCGAGAAACCGCGCCTT
313314315316317318319320321322323324325326327328329330331332333334335336
T M L R Y G V Q D L R L F F E N D L R F L R Q F
T M L - - - - - - - - - - - - - - - - - - - - -
CTCGTTCTC---------------------------------------------------------------
337
A
-
---
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_pheALPHA_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T T L L D E L T A L E Q E A F D A L N T V T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L T A L T E W K S R F I G K Q G R L T R L S R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L G T L P V A E R P L A G Q R V N S L R E Q L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A A F A A T K E R L E A Q A I A A E L A A E R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D I T M P G R R P A V G Y V H L T N Q I L R Q V
- - - - - - - - - - - - - - - L T N Q I L R Q V
---------------------------------------------GCTCAAAGTGCCCTTGAGATCGGCCAT
121122123124125126127128129130131132133134135136137138139140141142143144
Q Q I F A E M G F Q V W E S P E V E Y D A F N F
Q Q I F A E M G F Q V W E S P E V E - - - - - -
CGTCACACGACGACCGACTGCCAAAAACTCAAACTGGTGGAACATCATCTCGCT------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S L L N F P D D H P A R D M Q D T F Y V E M P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G A P S V L L R T H T S P G Q I H A M R K N A P
- - - - - L L R T H T S P G Q I - - - - - - - -
---------------GGTGCGTAACAGTACTGATGGCGCACCGGCCGG------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
N P L R V L I P G K V Y R N E Q V T V R S E M M
- - L R V L I P G K V Y R N - - - - - - - - M M
------GCGGGCCGGGTGGTCGTCGGGGAAATTGAGCAGGCT------------------------TTCAGG
217218219220221222223224225226227228229230231232233234235236237238239240
F H Q F E F L A V G R R V T M A D L K G T L S F
F H Q F E F L A V - - - - - M A D L K G T L S F
GCTTTCCCAAACCTGAAACCCCATTTC---------------CACTTGACGCAAAATTTGGTTGGTGAGATG
241242243244245246247248249250251252253254255256257258259260261262263264
F A E R M F G P G T Q V R L R P S Y F P F T E P
F A E - - - - - - - - - - - - - - - - - - - - -
GACATAACC---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
S A E M D V T C F L C G G K G C R I C K Y A G W
S A E M D V - - - - - - - - - - - - - - - - - -
CGCCTGGGCTTCCAACCG------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L E I G G C G M V H P N V L R N G G Y D P A E F
- E I G G C G M V - - - - - - - - - - - - - - F
---GCCGGCCAAAGGTCGTTCGGCGAC------------------------------------------CTG
313314315316317318319320321322323324325326327328329330331332333334335336
S G F A G G F G P E R V A M L K Y G I D D I R W
S G F A G G F G P E R V A M L - - - - - - - - -
CTTACCGATGAAGCGACTCTTCCATTCGGTGAGGGCTGTCAGATC---------------------------
337338339340341342343344345346347348349
F Y S G D Q R F V E Q F G
- - - - - - - - - - - - -
---------------------------------------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_pheALPHA_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q N F I E Q I Q K C E N L N D L E A I R I S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L G K K G I L T E G F T K L K E L E D E A K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F A A K L N A Q K E I F N E A Y L A K F K D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N L A L E E R M K Q D A L N F N Y F D E S I T T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G A L H P V M S T M D K I I E Y F I A L N F S I
- - - - P V M S T M D K I I E Y F I A L N F S I
------------TCCAAACATATAACGCAAAAAATCTTCCAATACACTTTTTAAATTTGCAAAGCTAACCTT
121122123124125126127128129130131132133134135136137138139140141142143144
E K G P L I E D D F H N F E A L N L P K S H P A
E K G P L I E - - - - - - - - - - - - - - - - -
TTGCCCTTCTTCCACCACAAG---------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R D M Q D T F Y F D D K R L L R T Q T S P V Q I
- - - - - - - - - - - - - L L R T Q T S P V Q I
---------------------------------------TTGTGCAAGCATTGTCCGTATTTGCACTGGCGA
169170171172173174175176177178179180181182183184185186187188189190191192
R T M L A Q K P P I R M I A P G A V F R R D F D
- - - - - - - - - I R M I A P G A V F R R - - -
---------------------------ATCAAAATAAAAGGTATCTTGCATATCTCTTGCGGG---------
193194195196197198199200201202203204205206207208209210211212213214215216
I T H T P M F H Q V E G L V V E E G Q K V S F A
- - - - P M F H Q V E G L V V - - - - - - - F A
------------CGCTTCAAAATTATGAAAGTCATCTTCTATTAA---------------------ATTCAA
217218219220221222223224225226227228229230231232233234235236237238239240
N L K S V L E D F L R Y M F G D V K V R F R P S
N L K S V L E D F L R - - - - - - - - - - - - -
AGCTATAAAATATTCTATGATTTTATCCATGGT---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F F P F T E P S A E V D I S C V F C K G K G C R
- - - - - - - S A E V D I - - - - - - - - - - -
---------------------AGCATCTTGTTTCATTCT---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V C K H T G W L E V L G C G I V D P N V Y N F V
- - - - - - - - E V L G C G I V - - - - - - - -
------------------------TATTTCTTTTTGTGCATTTAATTT------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G Y E N V S G Y A F G L G V E R F A M L L H Q I
- - - - V S G Y A F G L G V E R F A M L - - - -
------------TTTAAGCTTTGTAAAGCCTTCTGTTAAAATACCTTTTTTTCCAAGAAC------------
313314315316317318319320321322323324325326327328329330
P D L R S L F E G D L R L L E Q F R
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_pheALPHA_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T T S F Q Q L S N Q L E A L K V Q A N N D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A R A S D I S T I E K L R V S L M G K K G Q L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I I L K N M S K L P E E E R P W I G Q L A N L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K Q E V N S L I V K R I S A M K S E I M K D K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I R E T L D V T L P S I G I L S G H R H P L V K
- - - - - - - - - - - - - - - - - - - - P L V K
------------------------------------------------------------TACCTGATGAAA
121122123124125126127128129130131132133134135136137138139140141142143144
T T E D I V D I F C G L G Y R V V E G P E I E T
T T E D I V D I F C G L G Y R V V E - P E I E -
GACCGGTGAATGTGTAGCGTCGACACCATCCCTTCGATAAACTCGCCCAGGTGC---GATTCTAGTAGG---
145146147148149150151152153154155156157158159160161162163164165166167168
D Y Y N F T A L N I P K H H P A R D M Q D T F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L S E N Y L L R T H T S P V Q I R H L E K N P P
- - - - - L L R T H T S P V Q I - - - - - - - -
---------------ATCTCTAGCAGGATGATGTTTAGGAATATTGAG------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P T R I I A P G R V Y R R D G V D A T H S P V F
- T R I I A P G R V Y R R - - - - - - - - P V F
---AATCTCTGGGCCTTCCACAACACGATAACCAAGACC------------------------TGTTGTCTT
217218219220221222223224225226227228229230231232233234235236237238239240
H Q V E V L A I D E G L D F S H L R G T V M T F
H Q V E V L A I - - - - - F S H L R G T V M T F
AACAAGCGGATGACGATGACCAGA---------------AGGCAATGTTACATCTAACGTCTCGCGAATAAT
241242243244245246247248249250251252253254255256257258259260261262263264
L K Q F F G D L P V R F R A S Y F P F T E P S A
L K - - - - - - - - - - - - - - - - - - - - S A
CTTATC------------------------------------------------------------TTTCAA
265266267268269270271272273274275276277278279280281282283284285286287288
E V D V Q W Q D R W L E V M G C G M V D P A V L
E V D V - - - - - - - E V M G C G M V - - - - -
GAGGTTTGCAAG---------------------TTCCTCAGGTAATTTGCTCATATT---------------
289290291292293294295296297298299300301302303304305306307308309310311312
E G L G L D P K R W S G F A A G L G V E R F C M
- - - - - - - - - W S G F A A G L G V E R F C M
---------------------------TACTCTTAGCTTCTCGATAGTACTTATGTCGGAAGCCCTGGCTAT
313314315316317318319320321322323324325326327328329330331332333334
V R S S I D D I R R L Y T S D I R F L E Q F
V - - - - - - - - - - - - - - - - - - - - -
ATC---------------------------------------------------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_pheALPHA_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_pheALPHA_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A T A C S L Y E L L R D R K S I T C K A A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L S V P H G E L I S W M K S L E A N E V L K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L I K T T C I V L T K D G V A T L Q G G S Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y R L A S K L N D L A T S H P Q G Q G G L V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E L S K Y F S E G D F M V G V A G C M R A K W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I R I I S S G K K D P D P G Y E L C L P L A D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S D D T Q A L L Y G L V I P G T T D L V Q E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D D D L F K Q L K Q R K L V T T A E L K H F V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S K G E K Y E A G M K K L S P D L T I E M V R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H F L N N P S T E A A A K A G T P S F G F S I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P L N F E S L G S V P H A G A F H P L M E M R R
- - - - - - - - - - - - - - - - - P L M E M R R
---------------------------------------------------CCGCTGATGGAAATGCGAAGA
265266267268269270271272273274275276277278279280281282283284285286287288
L F V E A F V G M G F E Q M K T P K L V E S S F
L F V E A F V G M G F E Q M K T . K L V E - - -
CTATTCGTCGAGGCGTTTGTTGGAATGGGTTTTGAGCAGATGAAGACA---AAGCTGGTTGAA---------
289290291292293294295296297298299300301302303304305306307308309310311312
W N F D A L F Q P Q S H P A R D S Q D T F F V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G Q Y S Q T R R D S L D A E L V E R I R T A H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S G G E A M R S K G Y R Y V W K V S E A L R N V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GTT
361362363364365366367368369370371372373374375376377378379380381382383384
L R T H T T A V S A R V L Y E I G Q H Y Q K T G
L R T H T T A V S A - - - - - - - - - - - - - -
CTCCGCACGCACACTACTGCCGTCTCAGCC------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E F R P R R F F S I D R V Y R N E T L D A T H L
- - - - R R F F S I D R V Y R N - - - - - - - -
------------CGCCGCTTCTTCTCTATTGACAGGGTTTATCGCAAC------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
C E F N Q V E G M V I D R N L T L G N L I A T L
C E F N Q V E G M V I - - - - - L G N L I A T L
TGTGAGTTTAACCAGGTGGAAGGAATGGTTATT---------------CTTGGAAACCTTATCGCGACTCTC
433434435436437438439440441442443444445446447448449450451452453454455456
R A F F A R L G M T Q L K F K A T Y N P Y T A P
R A F F A - - - - - - - - - - - - - - - - - - -
CGTGCCTTCTTTGCT---------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S M E I F A F H P Q L K R W V E V G N S G L F R
S M E I F A - - - - - - - - - E V G N S G L F -
TCCATGGAAATTTTTGCA---------------------------GAGGTGGGTAACTCTGGACTCTTC---
481482483484485486487488489490491492493494495496497498499500501502503504
P E V L L P L G L P E D V Q V L A W G L S L E R
- - - - - - - - - - - - V Q V L A W G L S L E R
------------------------------------GTGCAAGTCCTGGCTTGGGGCCTTAGCCTAGAGAGG
505506507508509510511512513514515516517518519520521522523524525526527528
P T M I V H E I S N I R D L I G P S T S L E L I
P T M I - - - - - - - - - - - - - - - - - - - -
CCAACCATGATC------------------------------------------------------------
529530531532533534535536537538539540541
R E Y R V F T P A H A S L
- - - - - - - - - - - - -
---------------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_pro_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A E R K R W S Q E F S R W F D W V L E E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y D Y G R Y P V K G M G I W M P Y G Y Q I R R
- - - - - - - - - - - - - - - - - - - - - I R R
---------------------------------------------------------------ATTCGGCGC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V V E L I R D V L D E K G H E E V L F P L L I
R V V E L I R D V L D E K G H E E V L F P L L I
CGTGTCGTCGAACTCATCCGTGACGTCCTTGACGAGAAGGGGCACGAGGAAGTCCTCTTCCCCCTGCTTATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E T L L R K E S E H I R G F E G E V Y W V T H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G G T E P L D I K L A L R P T S E T S I T Y M E
- - - - - - - - - - A L R P T S E T S I T - - -
------------------------------GCTCTGCGCCCAACGAGCGAAACGAGTATAACC---------
121122123124125126127128129130131132133134135136137138139140141142143144
S F W I K S Y K Q L P R K F Y Q I V S I F R Y E
- - - - - - - - - - - R K F Y Q I V S I F R Y -
---------------------------------CGGAAGTTCTACCAGATAGTCAGCATATTCCGCTAC---
145146147148149150151152153154155156157158159160161162163164165166167168
T K A T R P L I R L R E V T T F K E A H T V H V
- - - - - - - - - - R E V T . F K E A H T V - -
------------------------------CGCGAAGTAACC---TTCAAGGAAGCCCACACAGTC------
169170171172173174175176177178179180181182183184185186187188189190191192
D F E D A D R Q V A E A I E L Y K R I F D E L G
- - - - - - - - V A E A I E L Y K R I F D - - -
------------------------GTAGCCGAGGCAATAGAGCTCTACAAGCGTATATTCGAC---------
193194195196197198199200201202203204205206207208209210211212213214215216
I P Y V I S R R P E W D K F A G A I Y T V A F D
- - - - - - - - - - - - - - - - - - - T V A F D
---------------------------------------------------------ACAGTGGCATTCGAC
217218219220221222223224225226227228229230231232233234235236237238239240
T V M P D G R T L Q I G T A H H L G Q N F T I P
T - - - - - - - - Q I G T A H H L - - - - - - -
ACC------------------------CAGATAGGCACAGCACACCACCTA---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F E V R I Q L P D E S L D Y A W Q T S Y G L S D
- - - - - - - - - - - - - - A W Q T S Y G L S D
------------------------------------------GCCTGGCAAACAAGCTACGGGCTAAGTGAC
265266267268269270271272273274275276277278279280281282283284285286287288
R V V A T V I A I H G D D R G A V L P P I V A P
R V V A T - - - - - - - - - - - - - - - - - - -
CGTGTAGTAGCCACA---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I Q V V V V P I P A R D E E Q R K R L Q D Y I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E V E E K L R R L G V R Y R I D D R E D V R P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R K F Y E W E A R G V P V R I E V G P R E A E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R T L V L A R R D T L E K T T I S I D E L E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L P E L L E D I A R S L R E R A W N W L Q S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K R V E T V E E A R C V I E E E R G I V E L P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C G R E E C G L R L E E S I D A G V L G S P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R P E W V R G K Q C P V C G Q P A V T S I R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483
K K Y
- - -
---------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_pro_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E N K K E N F S E W Y N E I V T I S D L S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R Y P I K G M N V W R P Y G W K I M K L I D N I
- - - - - - - - - - - - - - - - I M K L I D N I
------------------------------------------------ATAATGAAGCTTATAGACAACATA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I R N A V D K H S F D E V N F P V L I S R G M L
I R N A V D K H S F D E V N F P V L I - - - - -
ATAAGAAATGCCGTGGATAAACATTCTTTTGATGAGGTCAATTTTCCAGTTTTGATA---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V E F E H I R G F E N E I Y W V T K G G K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E E E L A L R P T S E S A M Y P M F S L W V R
- - - - - A L R P T S E S A M Y - - - - - - - -
---------------GCTTTACGCCCCACTAGCGAATCTGCTATGTAT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S H A D L P L K I Y Q I V S V Y R Y E T K H T R
- - - - - - L K I Y Q I V S V Y R Y - - - - - -
------------------TTGAAGATTTACCAGATAGTAAGCGTGTACAGGTAT------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S F I R I R E I H F F E A H T A H E S Y E D A E
- - - - - R E I H F F E A H T A - - - - - - - -
---------------AGAGAAATCCACTTTTTCGAGGCCCATACCGCT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K Q M D E Y R I I W T E I A D A L C L P F L Y D
- - M D E Y R I I W T E I A D - - - - - - - - -
------ATGGATGAATACAGGATCATATGGACGGAAATAGCAGAT---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q R P E W D K F P G A M Y T I A F D T V M P S G
- - - - - - - - - - - - - T I A F D T - - - - -
---------------------------------------ACTATAGCCTTCGATACA---------------
217218219220221222223224225226227228229230231232233234235236237238239240
R S L Q I G T I H Q Y G T N F S K N Y D I K Y L
- - - Q I G T I H Q Y - - - - - - - - - - - - -
---------CAGATCGGTACAATTCACCAATAC---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E D G T F E Y V H Q T T F G M S E R L L A A I
- - - - - - - - V H Q T T F G M S E R L L A A -
------------------------GTACATCAGACAACGTTTGGCATGAGCGAAAGACTTCTTGCGGCA---
265266267268269270271272273274275276277278279280281282283284285286287288
I G I H G D D K G L I L P P A I A P I Q V V I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I P G E G V E R Y A K D I E T T L N G I G I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
C H V D N R D N Y T P G Y K Y N D W E M R G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L R I E V G E R E L K E K T V T L A A R N I R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K K T V Q R E K L V Y E V P D M L D L V K E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T E D A K K T F N S L V V S A S S L D D F K K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G L I K A F W C G S K E C S D K I E N E T E K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A L G F N L N N D E T G K C I V C G K A G K L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462
I F S R S Y
- - - - - -
------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_pro_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E N K K E N F S E W Y N E I I T L A E L S D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R Y P V K G M N V W L P Y G W K I M S L I D S I
- - - - - - - - - - - - - - - - I M S L I D S I
------------------------------------------------GTCGGAACATTCCTTCGAACCACA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V R R A V D K R N F Q E V N F P I L I G R S M L
V R R A V D K R N F Q E V N F P I L I - - - - -
CCAGAATGCGGTTATAAGGCCATCCCTGTTGAATTCTTCAAGTTTCGTTGCCCTGAA---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V E F E H I R G F E N E I Y W V T K G G K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E E E L A L R P T S E S A M Y P M F S L W I R
- - - - - A L R P T S E S A M Y - - - - - - - -
---------------AAGCTTTCCCTGAATGTTTCTCATCGAAATGGT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S H A D L P L K I Y Q I V S V Y R Y E T K H T R
- - - - - - L K I Y Q I V S V Y R Y - - - - - -
------------------AAGTGGGACGCCCCTCATCTCCCAGTCGTTGAACTT------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S F I R I R E I H F F E A H T A H A T Y E D A E
- - - - - R E I H F F E A H T A - - - - - - - -
---------------CTTGACCCTTATATTTATGCTATTAAGCGTATT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A Q M D Q Y K E I W R E I S S L L C L P Y F Y D
- - M D Q Y K E I W R E I S S - - - - - - - - -
------TGCGCCGGGTATGGGTATTATGATCACCTGTATCGGAGC---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Q R P D W D K F P G A M Y T I A F D T V L P S G
- - - - - - - - - - - - - T I A F D T - - - - -
---------------------------------------CTCACTCATACCATAAGT---------------
217218219220221222223224225226227228229230231232233234235236237238239240
R S L Q I G T I H Q Y G T N F S K N Y D I K Y L
- - - Q I G T I H Q Y - - - - - - - - - - - - -
---------TCCATCCTCCTTAAGATACTTTAT---------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E D G T F D Y A H Q T T Y G M S E R L L A A I
- - - - - - - - A H Q T T Y G M S E R L L A A -
------------------------TGATGGAAGAACGGTGTCGAAGGCTATCGTGTACATTGCCCCTGG---
265266267268269270271272273274275276277278279280281282283284285286287288
I G I H G D D K G L V L P P D V A P I Q V I I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P I P G A G V M E Y A R D V E N T L N S I N I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V K V D D R E N Y T P G Y K F N D W E M R G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L R I E I G E R E V K N R T L T I S M R N I Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K L T I E R S K L I Y E V P D T L I R I R E K M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M E N A Q K V F K D H V F R A T K L E E F N R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G L I T A F W C G S K E C S D K I E A E T E K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V L G F M V D S S E T G K C V V C G K N G K M A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462
V F S R S Y
- - - - - -
------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_pro_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L I R E A R P H S R E K L K S N L I E W F H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W L L R E A E L Y D V R Y P V K G A Y V W R P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G M K I R R N V E N L I R K F H D E T G H E E V
- - - I R R N V E N L I R K F H D E T G H E E V
---------GTTGTCCCCGCTCCACGGGATCTCCACTACCTTGCCCTCTTTTATCGCGGCTTTTGCTACCTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L F P V F I P Y E F F G K E S Q H I K G F E K E
L F P V F I - - - - - - - - - - - - - - - - - -
TATATCCTCGGCCTTGAC------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V F W V S K G G E A G E R L V L R P T S E T A I
- - - - - - - - - - - - - - V L R P T S E T A I
------------------------------------------CACCGCGTATTTCTCCAATGTATCCCTCCT
121122123124125126127128129130131132133134135136137138139140141142143144
M P M V K L W I Q D Y K D L P L R V Y Q I V S V
M - - - - - - - - - - - - - - L R V Y Q I V S V
CGC------------------------------------------GACCCTGAGAGGTACGCCTTTTAACTC
145146147148149150151152153154155156157158159160161162163164165166167168
F R A E T K M T H P M I R L R E I S M F K E A H
F R A - - - - - - - - - - - R E I . M F K E A H
CCAGTAGTA---------------------------------GTCTACATA---ACGTATGCCTGCCTCATT
169170171172173174175176177178179180181182183184185186187188189190191192
T V H A D K E D A E R Q V R E A V E I Y K R I F
T V - - - - - - - - - - V R E A V E I Y K R I F
AAGCCG------------------------------TAACGGCGCCTCCTCCTCTCCGTAGTATATGGGGAT
193194195196197198199200201202203204205206207208209210211212213214215216
D E M C L A Y L I N K R P E W D K F A G A E Y T
D - - - - - - - - - - - - - - - - - - - - - - T
CAC------------------------------------------------------------------CAT
217218219220221222223224225226227228229230231232233234235236237238239240
I A F D T I L P D G R S L Q I G T V H Y L G T N
I A F D T - - - - - - - - Q I G T V H Y L - - -
TGCTGCAATACTCCT------------------------GTGTGCCAACTTCCTAGTCCCATC---------
241242243244245246247248249250251252253254255256257258259260261262263264
F T K V F E V T Y L D A D G T R K L A H T T S Y
- - - - - - - - - - - - - - - - - - A H T T S Y
------------------------------------------------------TATCTGTAACGACCTGCC
265266267268269270271272273274275276277278279280281282283284285286287288
G I S E R S I A A M L I T H G D D G G T T L P P
G I S E R S I A A - - - - - - - - - - - - - - -
GTCTGGGAGGATAGTGTCAAAGGCTAT---------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K L A P I Q V V V I P I Y Y G E E E A P L V M P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L V R E T A N R L N E A G I R V Y V D E R A D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T P G W K F Y Y W E L K G V P L R V E I G K R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V E K R Q A V I A R R D T L E K Y A V S I N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V D A V K Q L M K S V E E N L R K R A W E E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G R V V K A E D I E V A K A A I K E G K V V E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P W S G D N D C G I K I Q E L V G A D A L G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L D A D A S V G G Y D L R D L A C K E R R A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488
W L R L S E R Y
- - - - - - - -
------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_pro_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H A F L G N A Q L P S T P R G D R L E F S E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y A E V L R S A E I M D V R Y P V K G M Y V W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P Y G F E I R Q R V V E K L R R K L R E T G H E
- - - - - I R Q R V V E K L R R K L R E T G H E
---------------GGTCTCGACGATCCCCTCACCAACCAGTCTTCGTGCTTCCTCCGGGGAGTCCGTTCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E V L F P T L I P E T Q L K K E S E H I A G F E
E V L F P T L I - - - - - - - - - - - - - - - -
GAATATACCCTTTTCGAACTTCTC------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D E V Y W V T H G G L K E L D E K L A L R P T S
- - - - - - - - - - - - - - - - - - A L R P T S
------------------------------------------------------CCGGAAGACTACCGCGGT
121122123124125126127128129130131132133134135136137138139140141142143144
E T A I Y P M F A L W I R S H A D L P L K I F Q
E T A I Y - - - - - - - - - - - - - - L K I F Q
ACCCTCCTCGAGTTC------------------------------------------CCAGTAATGGAACTT
145146147148149150151152153154155156157158159160161162163164165166167168
I V N T F R Y E T K H T R P L I R M R E I T T F
I V N T F R Y - - - - - - - - - - - R E I T . F
GCGTCCCGGGCTCATGTCGCG---------------------------------CAGCATCTCCTC---CTC
169170171172173174175176177178179180181182183184185186187188189190191192
K E A H T A H A T E E E A E E Q V K E A V E I Y
K E A H T A - - - - - - - - - - V K E A V E I Y
CGCGGCACGTTCCAGGAT------------------------------GACCATCACAACCTGGTACGGAGC
193194195196197198199200201202203204205206207208209210211212213214215216
S S F F D E L G I P Y I A S V R P E W D K F P G
S S F F D - - - - - - - - - - - - - - - - - - -
CACGTCCGGCGGTAG---------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A E Y T V A F D T L M P D G R T L Q I G T V H M
- - - T V A F D T - - - - - - - - Q I G T V H M
---------GCAGGTCATGTACACGTA------------------------GTAGGTGACCTCGAACGTTCT
241242243244245246247248249250251252253254255256257258259260261262263264
L G Q N F A R T F E V T Y E T E E G D Q E Y V Y
L - - - - - - - - - - - - - - - - - - - - - V Y
CGC---------------------------------------------------------------GTCGAA
265266267268269270271272273274275276277278279280281282283284285286287288
M T C Y G I S D R V V A S M I A I H G D E R G L
M T C Y G I S D R V V A S - - - - - - - - - - -
GGCCACCGTGTACTCGGCGCCCGGGAACTTGTCCCACTC---------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V L P P D V A P Y Q V V M V P I L K K G V R R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I L E R A A E V E E M L R E E G V R V K V D D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D M S P G R K F H Y W E L K G V P L R I E L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R E L E E G T A V V F R R D E L E R E T Y A F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E L P D V V P E L L E D I A M E L R K R A R E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F E K G I F R T D S P E E A R R L V G E G I V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T G W C G S E R C G V R M E E E F G G D V L G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P Y P E E D T E F E R C P I C G E T A E Y T V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485
I A K T Y
- - - - -
---------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_pro_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E S E K E A A L P P K E E F S D W Y N E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
W M A E I M D V R Y P V K G L Y V W Y P F G F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I R R S T Y N I I R E I L D N S G H Q E T L F P
I R R S T Y N I I R E I L D N S G H Q E T L F P
ATCAGGAGGAGTACTTACAATATCATAAGGGAAATTCTCGATAACAGTGGGCACCAGGAAACCCTTTTTCCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L L I P E N E F M K E A E H I K G F E N E V Y W
L L I - - - - - - - - - - - - - - - - - - - - -
CTGCTGATC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V T H G G K D S L D I P L A L R P T S E T A I Y
- - - - - - - - - - - - - A L R P T S E T A I Y
---------------------------------------GCGCTCCGCCCCACAAGTGAGACTGCCATTTAT
121122123124125126127128129130131132133134135136137138139140141142143144
P M Y K M W V R S H A D F P I K L Y Q I V N T F
- - - - - - - - - - - - - - I K L Y Q I V N T F
------------------------------------------ATCAAACTCTACCAGATAGTCAACACTTTC
145146147148149150151152153154155156157158159160161162163164165166167168
R Y E T K H T R P L I R L R E I T S F K E A H T
R Y - - - - - - - - - - - R E I . S F K E A H T
CGCTAT---------------------------------AGGGAGATT---TCTTTTAAAGAAGCCCATACC
169170171172173174175176177178179180181182183184185186187188189190191192
V H A T W E D A E A Q V K E A V E L Y T E I Y R
V - - - - - - - - - - V K E A V E L Y T E I Y R
GTG------------------------------GTAAAGGAAGCTGTTGAACTTTACACCGAGATCTACCGC
193194195196197198199200201202203204205206207208209210211212213214215216
R L A V P V L R S R R P D W D K F P G A D Y T D
- - - - - - - - - - - - - - - - - - - - - - T D
------------------------------------------------------------------ACCGAT
217218219220221222223224225226227228229230231232233234235236237238239240
A I D A M M P D G R T L Q I G T V H H L G D N F
A I D A - - - - - - - - Q I G T V H H L - - - -
GCCATTGACGCC------------------------CAGATAGGAACCGTCCACCACCTT------------
241242243244245246247248249250251252253254255256257258259260261262263264
A K T F D I K Y E A P D G E Q R Y A H Q T C Y G
- - - - - - - - - - - - - - - - - A H Q T C Y G
---------------------------------------------------GCACACCAGACCTGTTACGGA
265266267268269270271272273274275276277278279280281282283284285286287288
I S E R S I A A T I S I H G D D K G L V L P P E
I S E R S I A A - - - - - - - - - - - - - - - -
ATTTCGGAGCGGTCTATTGCAGCC------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I A P V Q V V I I P I I F K K G A E E V L A A C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R D V Q E R L K K T G V K V E I D A S D L R P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A K Y Y R W E M K G V P L R L E I G P R D L E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N V A V S V R R D T G E K E Q I P L P E I E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V L Q K F E A I Q N S L Y E K A K V G L E S R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F D C T E L E E V K E K I Q K G V A T I P W C G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K K E C G L A M E D R I G A G I L G I P L T P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G K G K E K C P V C G A E T E T R V Y V A R T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_pro_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E N F S E W Y H N I L E T A G I Y D L R Y P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K G C G V Y L P Y G F K I R R Y A F E A I R D M
- - - - - - - - - - - - I R R Y A F E A I R D M
------------------------------------ATAAGAAGATATGCATTTGAAGCCATAAGAGATATG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L D E S N H D E A L F P M L I P E D L L A K E G
L D E S N H D E A L F P M L I - - - - - - - - -
CTTGACGAATCAAACCACGATGAAGCACTATTCCCAATGTTAATT---------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E H I K G F E E E V Y W V T H G G T T P L D V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L A L R P T S E T P I Y H M M K L W I K V H T D
- A L R P T S E T P I Y - - - - - - - - - - - -
---GCTTTAAGACCAACATCAGAAACTCCAATATAT------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L P I K I Y Q I V N S F R Y E T K H T R P L I R
- - I K I Y Q I V N S F R Y - - - - - - - - - -
------ATAAAAATATATCAAATTGTAAATTCATTTAGATAT------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L R E I M T F K E A H T A H S T S E E A E A Q V
- R E I . T F K E A H T A - - - - - - - - - - V
---AGAGAAATA---ACCTTTAAAGAGGCACATACAGCA------------------------------GTG
169170171172173174175176177178179180181182183184185186187188189190191192
Q T A L N I Y K T F F D R M G V P T I V S Q R P
Q T A L N I Y K T F F D - - - - - - - - - - - -
CAAACTGCACTAAATATATATAAAACATTCTTTGAT------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E W D K F P G A D Y T M A F D T I F P D G K T M
- - - - - - - - - - T M A F D T - - - - - - - -
------------------------------ACAATGGCTTTTGATACT------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q I G T V H N L G Q H F A K T F E L E F E T P E
Q I G T V H N L - - - - - - - - - - - - - - - -
CAAATTGGGACGGTGCATAATTTG------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
G G K D Y A Y Q T C Y G I S D R I I A S I I A L
- - - - - A Y Q T C Y G I S D R I I A S - - - -
---------------GCATACCAAACATGCTATGGTATTTCAGATAGAATAATAGCTTCA------------
265266267268269270271272273274275276277278279280281282283284285286287288
H G D E K G L I L P P E V A P H Q I I I I P L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F K G K E E I A M N K A K E I Y K S L K N T Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V K L D D R D I R P G K K F N D W E L K G A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R I E L G P R D I E N N K L T I Y R R D T G E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F Q I D E D N L L N E L N T L I D S I E N T I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E K A E Q K V K S F I T I L D N H D V N N I K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T L S T K K G V V L V P Y D E N I Y T E E F E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E I D A S V L G T T E Y D G K K Y I S I A K T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_pro_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V K K S E N P K E W Y N E I V R K A N I I D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A Y P V K G M P V Y K P Y G Y K A F K F L M S L
- - - - - - - - - - - - - - - - A F K F L M S L
------------------------------------------------TTTTATTTGGTTAGCACAGCTTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L E N K L E S I G A E P A W F P I V I P Y S I F
L E N K L E S I G A E P A W F P I V I - - - - -
TCTCATACAGAATGGGGCTTTTGCTATTTTGTTTTGCTCTATGGCTTCTTTTAATTC---------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K K E S E H I K G F E E E V F W I E R A G N D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E D P L I L R P T S E T E M Y Y M F A K W I E
- - - - - I L R P T S E T E M Y - - - - - - - -
---------------CTCGTTTAGAGAAATTGTGTATTTCTTTTTGTT------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S Y R D L P L I I Y M T N T V Y R Y E T K S T K
- - - - - - L I I Y M T N T V Y R Y - - - - - -
------------------TAAGCCAATGTCTATTCTTAATGGAACCCCAATCAA------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L I R G R E V L W N E T H S V H R S E E D A R
- - - - - R E V L W N E T H S V - - - - - - - -
---------------TGTATCGTCCGAATCTAAATAAACTCTATATTT------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E H M A K A K E V Y D Y I F W D V L Y L P Y I W
- - M A K A K E V Y D Y I F W - - - - - - - - -
------ATACTCTATTACTTTTGTATCGTCTTTGCCCAAAATTGG---------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V R R P E W D K F P G G E E T Y A A D A I M P D
- - - - - - - - - - - - - - T Y A A D A - - - -
------------------------------------------CAAAGCGCCTCCAAAAGC------------
217218219220221222223224225226227228229230231232233234235236237238239240
G R F L Q V G T I H L L G Q K F A I P F E I K F
- - - - Q V G T I H L L - - - - - - - - - - - -
------------TTGCCATACATATTTTCTAAAATC------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L D Y H P F Y K K Y G D P N I Y I K D K N G N E
- - - - - - - - - - - - - - - - I . . . . . . .
------------------------------------------------TAA---------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y K V H A P K E F W E E L E K G K L T K T Y T I
. . . . . P . . . . . . . . . . . . . . . . . .
---------------CGC------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K I G D K E Y T I S S I E E I N E K L K E Y D F
. . . . . . . . . . . . . . . . . . . . . . . .
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R K Y V W Q T S Y G I S M R A F G G A L Y W L G
. . . . . Q T S Y G I S M R A F G G - - - - - -
---------------TTGTAAAAACCTACCATCTGGCATTATTGCATCTGCAGC------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D D L G L V M P Y K I A P I Q I V I I P I L G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D D T K V I E Y S K K V Y E L I K D K Y R V Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D S D D T K T P G Y K Y Y Y Y D L I G V P L R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D I G L K E V E N N S I T I V R R D N K K K Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I S L N E L E K I D Q I F K E M E E D L K Q K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K S F V N D M V V R V K T F D E L K E A I E Q N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K I A K A P F C M R E S C A N Q I K E L L H A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V R G T D I N P E N A E K E R C V Y C G E P A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537
Y W V Y I G K T Y
- - - - - - - - -
---------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_pro_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V E R K R W S E E F S E W F N E V I E E A G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D K R Y P V K G M N V W L P Y G L K I M R N I
- - - - - - - - - - - - - - - - - - - I M R N I
---------------------------------------------------------ATAATGAGGAATATT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K F I H E E M E R T G H Q E V L F P A L I P E
E K F I H E E M E R T G H Q E V L F P A L I - -
GAGAAGTTCATCCACGAGGAGATGGAGAGGACTGGTCACCAGGAAGTTTTATTCCCAGCTCTAATC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T E F K K E A E H I A G F E G E V F W V T H A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H E P L D V R L V L R P T S E T A M Y S M F A L
- - - - - - - - V L R P T S E T A M Y - - - - -
------------------------GTATTAAGGCCGACAAGCGAGACGGCCATGTAT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
W I R S H A D L P F K V Y Q I V N V Y R Y E T K
- - - - - - - - - F K V Y Q I V N V Y R Y - - -
---------------------------TTTAAGGTTTATCAGATAGTGAATGTCTATAGATAT---------
145146147148149150151152153154155156157158159160161162163164165166167168
H T R P L I R V R E I S R F F E A H T A H A D F
- - - - - - - - R E I . R F F E A H T A - - - -
------------------------AGGGAGATA---AGATTCTTTGAAGCTCACACGGCC------------
169170171172173174175176177178179180181182183184185186187188189190191192
E D A E R Q I K E D L E I F D N L M R K L A L A
- - - - - - I K E D L E I F D N L M R - - - - -
------------------ATAAAAGAGGATCTCGAGATATTCGATAATTTAATGAGG---------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y I I S K R P E W D K F P G A F Y S L G A E V V
- - - - - - - - - - - - - - - - - S L G A E V -
---------------------------------------------------TCCCTGGGAGCTGAAGTA---
217218219220221222223224225226227228229230231232233234235236237238239240
M P D G R T L Q I G T M H N Y K Q N F S K A Y N
- - - - - - - Q I G T M H N Y - - - - - - - - -
---------------------CAGATAGGGACGATGCACAACTAT---------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I L Y E K E D G T H D Y V H Q T T F G M S E R L
- - - - - - - - - - - - V H Q T T F G M S E R L
------------------------------------GTTCACCAAACGACATTTGGGATGAGCGAAAGATTG
265266267268269270271272273274275276277278279280281282283284285286287288
L A A V I A I H G D D R G M V L P P T I A P I Q
L A A - - - - - - - - - - - - - - - - - - - - -
CTAGCCGCA---------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V V I V P I P K K G S E E E V Y S Y A K G I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E L R D A G I R V Y L D L R D K R P G W K F Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W E L K G V P V R V E V G P I D V Q N S T V V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R D K L E K I T V K R E E L V D K V R E L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E D I M E F L Y E R A N E W L E S H I K R V D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L E E A K A V F E D R R G I V E I P W C G E E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C G L K M E E E L E A K M L G I P Y P E E K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A P E G S K C P V C G R E A K F I A R F A R T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_pro_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A D V I T P R S V D Y A Q W Y V D V V R A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A D Y S P V R G C M I I L P N G Y A L W E N M
- - - - - - - - - - - - - - - - - - - L W E N M
---------------------------------------------------------CTCTGGGAGAACATG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R A V L D R M F K E T G H E N A Y F P L F I P Q
R A V L D R M F K E T G H E N A Y F P L F I - -
CGGGCCGTACTCGACCGCATGTTCAAAGAAACCGGCCACGAAAACGCCTATTTCCCGCTGTTCATC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S F L A K E A E H V E G F A K E C A V V T H S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K I D E K G Q L I P D P E S K L E E N L I V R
- - - - - - - - - - - - - - - - - - - - - I V R
---------------------------------------------------------------ATCGTCCGT
121122123124125126127128129130131132133134135136137138139140141142143144
P T S E T I I W D A F S R W I Q S W R D L P I L
P T S E T I I W - - - - - - - - - - - - - - I L
CCCACCAGCGAGACGATCATCTGG------------------------------------------ATCCTG
145146147148149150151152153154155156157158159160161162163164165166167168
I N Q W A N V V R W E M R T R L F L R T M E F L
I N Q W A N V V R W - - - - - - - - - - M E F L
ATCAACCAGTGGGCGAACGTGGTGCGCTGG------------------------------ATGGAATTCCTC
169170171172173174175176177178179180181182183184185186187188189190191192
W Q E G H T A H A T R E E A I E E A L R I L D I
W Q E G H T A - - - - - - - - - - A L R I L D I
TGGCAGGAAGGTCACACGGCC------------------------------GCGCTGCGCATTCTGGACATC
193194195196197198199200201202203204205206207208209210211212213214215216
Y T T F A E E Y M A M P V I Q G V K T P S E R F
Y T T F A E - - - - - - - - - - - - - - - - - -
TACACGACGTTCGCCGAA------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A G A V D T Y C I E A L M Q D G R A L Q A G T S
- - - - - T Y C I E A - - - - - - - - Q A G T S
---------------ACCTATTGCATCGAGGCG------------------------CAGGCCGGCACCAGC
241242243244245246247248249250251252253254255256257258259260261262263264
H F L G Q N F A K A F D C K F Q N Q N N E L E Y
H F L - - - - - - - - - - - - - - - - - - - - -
CACTTCCTG---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V W A T S W G V S T R L I G A L V M T H S D D Q
V W A T S W G V S T R L I G A - - - - - - - - -
GTCTGGGCCACCTCGTGGGGCGTTTCGACGCGCCTGATCGGGGCC---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L V L P P R L A P T Q V V I I P I F R N D V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K S A V L E Q A G R I E R E L K D A G F T V K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D A R E T H R P G W K F N E Y E V Q G V P V R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A I G P R D V E Q G T V E L A R R D T R T K E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V P Q E G L A E R V R M L L D D I Q Q N L L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A R A F R D E M T T R V D T Y E E F K E V L E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K G G F I L A H W D G T P E T E A R I K E E T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A T I R C I P L D R D A E A L G T R E E G R D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496
L T G K P S K Q R V V F A K A Y
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_pro_aa
Archaea/Staphylothermus marinus/Smarinus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L R E I S L F G E M G G I L S L E R F R L D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y A D F P K W Y H E I L K H A K I V D T R Y P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K G M N V W M P Y G L K A L R M I Q K I M I N L
- - - - - - - - - - - - A L R M I Q K I M I N L
------------------------------------GCTTTGAGAATGATCCAAAAAATAATGATTAATCTT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L E E T G H E E A Y F P T M I P E S V F S K E K
L E E T G H E E A Y F P T M I - - - - - - - - -
CTCGAAGAAACTGGGCACGAAGAAGCATATTTTCCAACAATGATA---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D F L Q G F G G E T F V V E G T M T K K F N E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L F V R P T S E T V M Y Y M W N I W I K G R K D
- F V R P T S E T V M Y - - - - - - - - - - - -
---TTTGTTCGCCCTACTAGTGAAACAGTCATGTAT------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P L K M Y Q V V N V F R Y E T K M T H P I L R
- - L K M Y Q V V N V F R Y - - - - - - - - - -
------CTGAAAATGTATCAAGTGGTCAATGTATTCAGATAT------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V R E I M S F I E A H T A H A T S E E A E K Q I
- R E I . S F I E A H T A - - - - - - - - - - I
---AGAGAAATA---AGTTTTATAGAAGCACACACAGCC------------------------------ATC
193194195196197198199200201202203204205206207208209210211212213214215216
N E A L S I Y K K F F D S L L L P Y F I V K T P
N E A L S I Y K K F F D - - - - - - - - - - - -
AATGAAGCCTTAAGCATATATAAAAAATTCTTTGAC------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P W D T F A G A E Y N Y D F I T A M P D G K G L
- - - - - - - - - - N Y D F I T - - - - - - - -
------------------------------AACTACGACTTCATAACA------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E L G S V I N L G Q K F A R A F D I K F M D S D
E L G S V I N L - - - - - - - - - - - - - - - -
GAACTGGGTTCAGTTATTAATCTT------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G V T K H V Y Q T C Y G V S E R T L G A V I A I
- - - - - V Y Q T C Y G V S E R T L G A - - - -
---------------GTTTATCAAACATGTTATGGTGTAAGTGAGAGAACATTAGGAGCT------------
289290291292293294295296297298299300301302303304305306307308309310311312
H G D Q K G L F L P P I I A P I Q V V I V P I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R R D E Q D I I E Y A K K I S E K L K K A G I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T F L D D D P E H T P G W K Y Y F W E M K G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T R I E I G R R E L N N N T V T I A R R D G A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K I T V S I N D M V D K L R S I W I E I N D Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R K K A I E H L K K M T I I T Y K P E E I G K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
V K G L I I T P W D G T K E C A D K L E E I T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K Q V L G E I I E S P I K L P S L Q G K T I C N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493
N K P D R Y A L I G T T Y
- - - - - - - - - - - - -
---------------------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_pro_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P A K R E R W S R E F S R W F D W V L E E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I Y D Y G R Y P V K G M G V W L P Y G F Q I R R
- - - - - - - - - - - - - - - - - - - - - I R R
---------------------------------------------------------------ATTAGGAGG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R V I E L V R R V L D G A G H E E V L F P L L I
R V I E L V R R V L D G A G H E E V L F P L L I
AGGGTTATCGAGCTCGTCAGGAGGGTGCTCGACGGGGCCGGGCATGAGGAGGTTCTCTTCCCCCTGCTGATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P E T L L R R E S E H I R G F E G E V Y W V A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G G S E P L D V R L A L R P T S E T S I S Y M E
- - - - - - - - - - A L R P T S E T S I S - - -
------------------------------GCGCTGCGGCCCACGAGCGAGACGAGTATAAGC---------
121122123124125126127128129130131132133134135136137138139140141142143144
S F W I K S Y K Q L P R R F Y Q I V S I F R Y E
- - - - - - - - - - - R R F Y Q I V S I F R Y -
---------------------------------CGCCGGTTCTACCAGATAGTGAGCATTTTCCGCTAC---
145146147148149150151152153154155156157158159160161162163164165166167168
T K A T R P L I R L R E V T T F K E A H T V H A
- - - - - - - - - - R E V T . F K E A H T V - -
------------------------------AGGGAGGTAACC---TTCAAGGAGGCCCACACGGTT------
169170171172173174175176177178179180181182183184185186187188189190191192
S F E D A D R Q V A E A I E L Y K R I F D E L G
- - - - - - - - V A E A I E L Y K R I F D - - -
------------------------GTGGCGGAGGCTATAGAGCTCTACAAGCGGATATTCGAC---------
193194195196197198199200201202203204205206207208209210211212213214215216
I P Y A V S R R P E W D K F A G A V Y T V A F D
- - - - - - - - - - - - - - - - - - - T V A F D
---------------------------------------------------------ACAGTGGCCTTCGAT
217218219220221222223224225226227228229230231232233234235236237238239240
T V M P D G R V L Q I G T V H H L G Q N F T I P
T - - - - - - - - Q I G T V H H L - - - - - - -
ACA------------------------CAGATAGGCACCGTGCACCACCTG---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F E V R I Q L P D E S L D Y A W Q T S Y G L S D
- - - - - - - - - - - - - - A W Q T S Y G L S D
------------------------------------------GCCTGGCAGACGAGCTACGGGCTCAGCGAC
265266267268269270271272273274275276277278279280281282283284285286287288
R V I A S L I A L H G D D R G A A L P P A V A P
R V I A S - - - - - - - - - - - - - - - - - - -
AGGGTGATAGCGAGC---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I Q V V V V P I P A R G E E Q A R R L E E Y I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E V E E R L R R L G L R Y H V D R R E E V R P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R K F Y E W E A R G V P V R I E A G P K E A E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R T L V V A R R D T L E K T V V K L E E L E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L P G I L E D V A R G L R E R A W S W L R S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K R V E G V E E A G R A I E E E R G I V E L P W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
C G N E E C G K R L E E E V D A A V L G S P L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R P E W V R G K R C P V C G R P A V T S I R L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483
K T Y
- - -
---------
Class II
Bacteria/Escherichia coli/amino acid sequences/Ecoli_pro_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Q A R L E P V L P S N W N R N N M R T S Q Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L S T L K E T P A D A E V I S H Q L M L R A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
M I R K L A S G L Y T W L P T G V R V L K K V E
- - - - - - - - - - - - - - - - - - V L K K V E
------------------------------------------------------CACTTCGATACCTTGTGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N I V R E E M N N A G A I E V L M P V V Q P S E
N I V R E E M N N A G A I E V L M P V V Q - - -
GCGCAGTTCGCTGTACAGTTTCTCAGCAAGTTCCTGTACGCGGAAGGATTTGTGCATGTTCAT---------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L W Q E S G R W E Q Y G P E L L R I A D R G D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P F V L G P T H E E V I T D L I R N E L S S Y K
- - V L G P T H E E V I T - - - - - - - - - - -
------CACACGCGTTACGCCGATACCGTAGCAACCCAT---------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q L P L N F Y Q I Q T K F R D E V R P R F G V M
- - - L N F Y Q I Q T K F R D - - - - - - - - -
---------TTTCAGTGCTTCGGAGTACTTGGTACCCAGCTGGAA---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R S R E F L M K D A Y S F H T S Q E S L Q E T Y
- - R E F L M K D A Y S F - - - - - - - - - - Y
------CAGCGTACCCTGACCATCCGGGCTTGGATCGCC------------------------------CGG
193194195196197198199200201202203204205206207208209210211212213214215216
D A M Y A A Y S K I F S R M G L D F R A V Q A D
D A M Y A A Y S K I F S - - - - - - - - - - - -
AGTAGCGACATCGCGATCCCAGTTGATACCGAAGTA------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
T G S I G G S A S H E F Q V L A Q S G E D D V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F S D T S D Y A A N I E L A E A I A P K E P R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A A T Q E M T L V D T P N A K T I A E L V E Q F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N L P I E K T V K T L L V K A V E G S S F P L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A L L V R G D H E L N E V K A E K L P Q V A S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L T F A T E E E I R A V V K A G P G S L G P V N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
M P I P V V I D R T V A A M S D F A A G A N I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G K H Y F G I N W D R D V A T P E I A D I R N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V A G D P S P D G Q G T L L I K R G I E V G H I
- - - - - - - - - - - - - L I K R G I E V G H I
---------------------------------------GGAACGCATGACGCCAAAACGCGGACGCACTTC
433434435436437438439440441442443444445446447448449450451452453454455456
F Q L G T K Y S E A L K A S V Q G E D G R N Q I
F Q L - - - - - - - - - - - - - - - - - - - - -
GTCGCGGAA---------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L T M G C Y G I G V T R V V A A A I E Q N Y D E
L T M G C Y G I G V T R V V A A - - - - - - - -
CAGGTCTGTAATCACTTCTTCATGAGTTGGGCCGAGTACGAACGGACG------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R G I V W P D A I A P F Q V A I L P M N M H K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F R V Q E L A E K L Y S E L R A Q G I E V L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D R K E R P G V M F A D M E L I G I P H T I V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G D R N L D N D D I E Y K Y R R N G E K Q L I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590
T G D I V D Y L V K Q I K G
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_pro_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P K E V I T Q R S V D Y N Q W Y L D I V R E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L A E V A E V V R G C I V V K A H G W A I W E
- - - - - - - - - - - - - - - - - - - - - I W E
---------------------------------------------------------------GGCGGTACT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L M Q R A L D D R I K A T G H A N V Q F P L L I
L M Q R A L D D R I K A T G H A N V Q F P L L I
GCCGGCCCAATAGGCACGGGCGAAGCCGCGTTCGATCTGTTCTTTAAGCTCGTCATAGGTTGTGACATCGGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P K S F I M K E A E H V E G F A P E V A E V T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A G G E E L A E P Y V I R P T S E T I I G Y F Y
- - - - - - - - - - V I R P T S E T I I G - - -
------------------------------ACTCTTGCCGGCTTTGCCTGGCATATCGCGGCG---------
121122123124125126127128129130131132133134135136137138139140141142143144
S K W I R S Y R D L P L L Y N Q W A N V M R W E
- - - - - - - - - - - L L Y N Q W A N V M R W -
---------------------------------CTCGATCCGCACCGGCACCCCTTTCAGTTCCCACTC---
145146147148149150151152153154155156157158159160161162163164165166167168
M R T R P F L R T A E F W W Q E G H T A H A T E
- - - - - - - - - A E F W W Q E G H T A - - - -
---------------------------GCGATCGTCAACCTTAAAGCGCAACCGGCCCTT------------
169170171172173174175176177178179180181182183184185186187188189190191192
A E A E E E T L R I L H E V Y A D F V E K E M A
- - - - - - T L R I . H E V Y A D F V E - - - -
------------------CATCACTGCGCT---CTCTTCATCGTTCTTGTAAATTGGCAC------------
193194195196197198199200201202203204205206207208209210211212213214215216
V P V I R G L K T E K E K F P G A L R S Y C I E
- - - - - - - - - - - - - - - - - - - S Y C I E
---------------------------------------------------------CAGAGCGCCGATCAG
217218219220221222223224225226227228229230231232233234235236237238239240
A M M Q D G R A L Q A G T S H N L G Q N F A R A
A - - - - - - - - Q A G T S H N L - - - - - - -
GCG------------------------CCACGCATACTGGATGGTGTTATG---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F D I T F T D Q H N T I Q Y A W T T S W G V S T
- - - - - - - - - - - - - - A W T T S W G V S T
------------------------------------------GGCTTGGAGGGCGCGACCATCTTGCATCAT
265266267268269270271272273274275276277278279280281282283284285286287288
R L I G A L I M T H S D D E G L V L P P R L A P
R L I G A - - - - - - - - - - - - - - - - - - -
TGCTTCGATGCAATA---------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I Q V V V V P I Y K N D E E R S A V M E A V N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
M T A A W K G R L R F K V D D R D T Y S P G Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
F N E W E L K G V P V R I E I G P K D V A K E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V A L A R R D M P G K A G K S F V P Q A G L T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R I E A L L A E M Q T G L F Q R A L A F R E A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T A D V T T Y D E L K E Q I E R G F A R A Y W A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
G S T A D E K R I Q E E T R A T I R C I P L E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P G T V G R C V Y T G R E T D R Q V I F A R A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_pro_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K A S R F F I G T L K E A P A D A E I V S H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L M V R A G M I R R V A G G I Y N Y L P V G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S I R K V E A I V R E E M N R A G A I E L L M P
S I R K V E A I V R E E M N R A G A I E L L M P
TCGATTCGCAAGGTCGAGGCGATCGTGCGCGAGGAGATGAACCGGGCGGGCGCGATCGAGCTGCTGATGCCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A V Q P A E L W Q E S G R W E Q Y G P E L L R F
A V Q - - - - - - - - - - - - - - - - - - - - -
GCCGTGCAG---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D R K Q N E F V I G P T H E E V V T D I A R N
- - - - - - - - V I G P T H E E V V T - - - - -
------------------------GTGATCGGGCCGACGCACGAAGAAGTCGTCACG---------------
121122123124125126127128129130131132133134135136137138139140141142143144
Q I K S Y R Q M P V N F Y Q I Q T K F R D E I R
- - - - - - - - - V N F Y Q I Q T K F R D - - -
---------------------------GTGAACTTCTATCAGATCCAGACGAAGTTCCGCGAC---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G V M R G R E F I M K D A Y S F D K D H E
- - - - - - - - R E F I M K D A Y S F - - - - -
------------------------CGCGAGTTCATCATGAAGGACGCGTATTCGTTC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L K E S Y K K M Y D A Y V R I F T R I G L E F
- - - - - Y K K M Y D A Y V R I F T - - - - - -
---------------TACAAGAAGATGTACGACGCGTACGTGCGGATCTTCACG------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R P V A A D N G S I G G S G S H E F H V I A D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E D A I A Y C P T S D F A A N V E A A E A L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L L A S R A A P A E A M Q K V A T P G K A K C E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V A E L M G I P L E R T I K S I V L A T D N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G A E P T V W L L M L R G D H D L N E I K T A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L P G L A G Y R F A T E A E I V E W F G T P P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
Y L G P I G T K K P V R V V A D R T V A N M S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
F V V G A N E V D Y H I A G V N W G R D L P E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V I A D I R N V K A G D P S P D G K G V L D I C
- - - - - - - - - - - - - - - - - - - - - D I C
---------------------------------------------------------------GACATCTGC
409410411412413414415416417418419420421422423424425426427428429430431432
R G I E V G H V F Q L G T K Y S D A M G A T F I
R G I E V G H V F Q L - - - - - - - - - - - - -
CGCGGCATCGAAGTCGGCCATGTGTTCCAACTC---------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
D E S G K A Q P M V M G C Y G I G V T R I L G A
- - - - - - - - M V M G C Y G I G V T R I L G A
------------------------ATGGTGATGGGCTGCTACGGGATCGGCGTCACGCGGATTCTCGGCGCG
457458459460461462463464465466467468469470471472473474475476477478479480
A I E Q N F D D K G I I W P E A I A P F E V V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
C P M G Y D R S D A V R E A A D K L Y A D L A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A G I D V I L D D R G E R P G V M F A D W E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G V P H R L V I G E R G L K D G K I E Y Q G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D A E A T L L P A D S A A T A V A E K V R A A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578
A R
- -
------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_pro_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L K F A A M R L S Q M L F V T L R E D P A E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E I P S H K L L L R A G Y I R R I A S G I Y A Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L P L M W R V L R K V S Q I V R E E M D A T G A
- - - - - - V L R K V S Q I V R E E M D A T G A
------------------GTATTACGCAAGGTCTCGCAGATTGTGCGCGAAGAGATGGATGCGACCGGCGCA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q E T L L P Q L Q P A E L W Q E S G R W E T Y T
Q E T L L P Q L Q - - - - - - - - - - - - - - -
CAGGAAACCTTGTTGCCGCAACTGCAA---------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K A E G I M F S L D D R Q Q R Q L G L G P T H E
- - - - - - - - - - - - - - - - - G L G P T H E
---------------------------------------------------GGCTTGGGGCCGACCCACGAG
121122123124125126127128129130131132133134135136137138139140141142143144
E V I T A V A R D L I R S Y R Q L P Q N L Y Q I
E V I T - - - - - - - - - - - - - - Q N L Y Q I
GAAGTGATCACT------------------------------------------CAGAACCTCTATCAAATT
145146147148149150151152153154155156157158159160161162163164165166167168
Q T K F R D E I R P R F G L M R G R E F I M K D
Q T K F R D - - - - - - - - - - - R E F I M K D
CAGACTAAATTCCGGGAT---------------------------------CGGGAATTCATCATGAAGGAC
169170171172173174175176177178179180181182183184185186187188189190191192
A Y S F H A D E E S L R Q T Y A A M D Q A Y R N
A Y S F - - - - - - - - - - Y A A M D Q A Y R N
GCCTACTCCTTC------------------------------TACGCGGCAATGGATCAGGCTTATCGCAAT
193194195196197198199200201202203204205206207208209210211212213214215216
I F R R C G L Q F R A V E A D S G A I G G S A S
I F R - - - - - - - - - - - - - - - - - - - - -
ATCTTCCGG---------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q E F M I L A D A G E D E I L Y T E D G R Y A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N V E K A V S L P A E A I A S A F T T F E K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
T P G T D T I A S L C E F L K A D P T Q V V K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V L Y Q A V F D N G K L L P I L I S I R G D Q S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V N E I K L T N E L T R R A A D Y G A K T V I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L T V P D A E A L K K W T A A P L P L G Y L G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D L A D S A I A V N E S I I P K F L R L V D P T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A A E L Q N F V T G A N E V N F H V V G A N W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
T N F P K P A V V D L R T A L V G D R A Q H D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
S Q V L A S A R G I E A G H I F Q L G L K Y S Q
- - - - A S A R G I E A G H I F Q L - - - - - -
------------GCATCTGCTCGCGGGATTGAAGCAGGTCACATCTTCCAGTTG------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A M G A T F T T E N G T E E P L W M G C Y G I G
- - - - - - - - - - - - - - - L W M G C Y G I G
---------------------------------------------TTGTGGATGGGCTGCTATGGCATTGGG
481482483484485486487488489490491492493494495496497498499500501502503504
V S R V A Q A A V E Q S Y D K D G I I W P V A I
V S R V A Q A - - - - - - - - - - - - - - - - -
GTGTCGCGGGTGGCTCAGGCT---------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
A P Y Q A V V V I P N I T D T E Q V A A A E K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y A D L T A A G I E T L L D D R D E R A G V K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K D A D L I G I P Y R I V T G R S L K E G K V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
V V Q R A S K E S S V I A V G S V V E T V Q D W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606
I A A A I V
- - - - - -
------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_pro_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K E L K D L T K R S E N Y S Q W Y N D L V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A D L A E Q S A V R G C M V I K P Y G Y A I W
- - - - - - - - - - - - - - - - - - - - - - I W
------------------------------------------------------------------TTCCTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E K M Q R Q L D D M F K E T G H V N A Y F P L L
E K M Q R Q L D D M F K E T G H V N A Y F P L L
CGTCTCCACTGTTCCATCCCAGTGAGCCAGGATAAAGCCGCCTTCTTCGATTTTCTCCTTAAACTCATCATA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I P K S F L S R E A E H V E G F A K E C A V V T
I - - - - - - - - - - - - - - - - - - - - - - -
GCT---------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H Y R L K N A E D G S G V V V D P A A K L E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L I I R P T S E T I I W N T Y K N W I Q S Y R D
- I I R P T S E T I I W - - - - - - - - - - - -
---CTCCATCGTATTGTTCTCCAAGTCACGTCCACC------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P I L C N Q W A N V F R W E M R T R L F L R T
- - I L C N Q W A N V F R W - - - - - - - - - -
------AAATTTAAAGCCCGGACGTTTATTGTCAGCATTATC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A E F L W Q E G H T A H A T R E E A E E E A I R
A E F L W Q E G H T A - - - - - - - - - - A I R
TCTTGCCACAATACCTTCTACCTTAGCATCAAT------------------------------AGGAACGAT
193194195196197198199200201202203204205206207208209210211212213214215216
M L N V Y A E F A E K Y M A V P V V K G V K S A
M L N V Y A E F A E - - - - - - - - - - - - - -
CACTACTTGGATCGGAGCCAGATGCGGAGG------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N E R F A G A L D T Y T I E A M M Q D G K A L Q
- - - - - - - - - T Y T I E A - - - - - - - - Q
---------------------------AGAGGTAGCCCATACATA------------------------AAA
241242243244245246247248249250251252253254255256257258259260261262263264
S G T S H F L G Q N F A K A F D V Q F V N K E N
S G T S H F L - - - - - - - - - - - - - - - - -
TTGAACATCGAATGCTTTTGC---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K L E Y V W A T S W G V S T R L M G A L I M T H
- - - - V W A T S W G V S T R L M G A - - - - -
------------CTCGATGGTATACGTGTCAAGTGCACCGGCAAAGCGCTCATTAGC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
S D D N G L V L P P H L A P I Q V V I V P I Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N D E Q L K L I D A K V E G I V A R L K Q L G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S V K Y D N A D N K R P G F K F A D Y E L K G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
P V R L V M G G R D L E N N T M E V M R R D T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E K E T V T C D G I E T Y V Q N L L E E I Q A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I Y K K A R T Y R D S R I T T V D S Y D E F K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K I E E G G F I L A H W D G T V E T E E K I K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E T K A T I R C I P F E S F V E G D K E P G K C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497
M V T G K P S A C R V I F A R S Y
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_pro_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Q S Q A F I P T L R E V P A D A E V K S H Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L L R A G F I R Q S A S G V Y T F L P L G Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L Q K I E A I I R E E M N R I G G M E L L M P
V L Q K I E A I I R E E M N R I G G M E L L M P
ATCGCTGTCGGCAAACTTGACTCCGGCCCGCTCCGGGCGGTCATCGTATAACACTTCAAATCCTGCCTGTCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L Q P A E L W Q Q S G R W Y S Y G P E L M R L
A L Q - - - - - - - - - - - - - - - - - - - - -
CAATTTTTC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D R H E R D F A L G P T H E E M I T A I V R D
- - - - - - - - A L G P T H E E M I T - - - - -
------------------------CCAGACGAGCCCGTTTTCATCGGCAAACTGCTC---------------
121122123124125126127128129130131132133134135136137138139140141142143144
E V K T Y K R L P L V L Y Q I Q T K F R D E K R
- - - - - - - - - L V L Y Q I Q T K F R D - - -
---------------------------GCCCATGATCATCGTCTTCGTTTGGCCGTTTTCATC---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G L L R G R E F M M K D A Y S F H T T K E
- - - - - - - - R E F M M K D A Y S F - - - - -
------------------------CGTGCCAAGCTTGAACACGTGCCCGACTTCAAT---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L D E T Y N D M Y N A Y S N I F R R C G L N F
- - - - - Y N D M Y N A Y S N I F R - - - - - -
---------------GTCCGGAGACGGATCGCCCTCTTGGACAAAGCGCAAGTC------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R A V I A D S G A I G G K D T H E F M V L S D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E D T I A Y S D A S D Y A A N I E M A P V V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
T Y E K S S E P P A E L K K V A T P G Q K T I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V A S Y L Q V S P E R C I K S L L F N V D G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y V L V L V R G D H E A N E V K V K N V L N A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V V E L A T P E E T E R V M G A P V G S L G P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G V S E A V M V I A D H A V A A I V N G V C G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N E E G Y H Y I G V N P D R D F A V S Q Y A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R F V Q E G D P S P D G K G T I R F A R G I E V
- - - - - - - - - - - - - - - - R F A R G I E V
------------------------------------------------TTCTTTTGTCGTATGGAACGAATA
409410411412413414415416417418419420421422423424425426427428429430431432
G H V F K L G T K Y S E A M N A V Y L D E N G Q
G H V F K L - - - - - - - - - - - - - - - - - -
GGCGTCTTTCATCATGAA------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
T K T M I M G C Y G I G V S R L V A A I A E Q F
- - - M I M G C Y G I G V S R L V A A - - - - -
---------GTACAACACAAGCGGCAGCCGCTTGTACGTTTTCACTTCATCGCGGAC---------------
457458459460461462463464465466467468469470471472473474475476477478479480
A D E N G L V W P A S V A P F H I H L L T A N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K S D E Q R A L A E E W Y E K L G Q A G F E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Y D D R P E R A G V K F A D S D L I G I P V R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T V G K R A G E G I V E V K V R K T G E T F D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567
P V G E L T D T V R R L L Q G
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_pro_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R M K D L Y A P T L K E T P S D V E T V S H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y L L R G G F I R K V A A G I Y T Y L P L G R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L L K I E N I V R E E M N R I G A Q E I L M P
V L L K I E N I V R E E M N R I G A Q E I L M P
TCTTCCCACGTTTATTCTTATGGGAAAGCCTATGAGATCGGCGTCTTTGAATTTGAAACCAGGCGAGACTTC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I L Q P A E L W K Q S G R W D D Y G P E M M K L
I L Q - - - - - - - - - - - - - - - - - - - - -
TCTGTCATC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D R H E R D F T L G P T H E E I V T D L V K N
- - - - - - - - T L G P T H E E I V T - - - - -
------------------------GTCCACCACAACGGTGTAAGGGGCGATCGAAAG---------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L R S Y K Q L P L T L Y Q I A N K Y R D E I R
- - - - - - - - - L T L Y Q I A N K Y R D - - -
---------------------------AGCCGCCATCGTTCTGGAAACTCCCCAGCCATAACA---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G L L R A R E F I M K D A Y S F H A S W E
- - - - - - - - R E F I M K D A Y S F - - - - -
------------------------ATCCATGAAGTAGGCCTTCATGGCTTCGGAGTA---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L D E T Y E Q F K K A Y S R I M E R L G V R Y
- - - - - Y E Q F K K A Y S R I M E - - - - - -
---------------CTCTATCCCTTTTGTCGCCTTGAGAGGCTCACCACAGAC------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M I I E A E T G A I G G N A S H E F V V P A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E T N V L F C E K C G Y Q A S D E K A E Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E Y T Q E Q E E E K P L K K V P T P G V K T I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V S E F L G V P P S K I V K S L L Y K G R E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y V M V L I R G D L E L N E A K L K A H L K D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S L R M A T P E E I L K D F G V P V G F I G P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G V D V K K V A D H S V R G L K N F V V G G M E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E D T H Y V N A N H P R D F K V D E W Y D L R T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V V E G D P C P V C G E P L K A T K G I E L G H
- - - - - - - - - - - - - - K A T K G I E L G H
------------------------------------------CGCTTTTTTGAACTGTTCGTACGTCTCGTC
409410411412413414415416417418419420421422423424425426427428429430431432
I F K L G T K Y S E A M K A Y F M D E N G E M K
I F K L - - - - - - - - - - - - - - - - - - - -
CAGAGATTCCCA------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P F I M G C Y G W G V S R T M A A V V E H F H D
- F I M G C Y G W G V S R T M A A - - - - - - -
---TGGTCTGATTTCGTCTCTGTACTTGTTCGCTATCTGATACAGAGTGAG---------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E N G M I W P L S I A P Y T V V V D I L N M N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
A E Q K Q V G E K I Y Q V L S E K G E E V V L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R E V S P G F K F K D A D L I G F P I R I N V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G R S L K E G V V E L K K R Y S K E L V K V N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K N G F G A L L E T L E K M K R E Y D P K E A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577
R
-
---
Class II
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_pro_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R W S R Y F L Y T E K E E P K E A E A P S H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L L K A G F I K Q V S A G I Y E L L P P A Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L K K V E S I I R K E M D R S G A Q E L L L T
V L K K V E S I I R K E M D R S G A Q E L L L T
TCCCACTAAATCTGCGTCCGCGAATTTAAATCCGGGGCTCTCTTCCCTGTCGTCGAATATTACGTCTATTCC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V L N P K E L W E E T G R W E T Y G E E L F K L
V L N - - - - - - - - - - - - - - - - - - - - -
CTTTTCCTC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D R N G R E Y C L G P T H E E E I T D L V R R
- - - - - - - - C L G P T H E E E I T - - - - -
------------------------GGGAGTTGGCCACTTTATCCCTTTATCGTCGTG---------------
121122123124125126127128129130131132133134135136137138139140141142143144
V V R S Y R Q L P V I L Y Q I Q V K F R D E K R
- - - - - - - - - V I L Y Q I Q V K F R D - - -
---------------------------GCCGTAACAGCCCATAATTATGGGTTTTTCCTTTCC---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G L I R A R E F I M K D A Y S F D T D D M
- - - - - - - - R E F I M K D A Y S F - - - - -
------------------------CGAGTACCTCGTTCCGAGCAGGAATATGTGTCC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S A M I S Y E A M K F A Y Q R I F N K L R L N V
- - - - - Y E A M K F A Y Q R I F N - - - - - -
---------------AGAACCACATTTGGGACATGGGTCTCCTTCCCTTACCTC------------------
193194195196197198199200201202203204205206207208209210211212213214215216
I M A E A D V G Q I G G K M S H E F I A F T D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E A K V A Y C E N C G Y A A N A E I V P L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P E E E K E E E K P M E K V H T P N V H T I E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L S K F L D V H P S K I M K A V L Y I V N E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
P V L V L I R G D R E I D E N K L E K V L G T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N F R L A T D E E V Q E L L G T K K G F I G I F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N L P E N I K V L W D N S L Y G V K N L V V A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N E P D W H Y I N V N P G R D F Q Y G E F V D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A E V R E G D P C P K C G S P L K V R R G L E L
- - - - - - - - - - - - - - - - K V R R G L E L
------------------------------------------------CATCGCGGACATATCGTCCGTATC
409410411412413414415416417418419420421422423424425426427428429430431432
G H I F L L G T R Y S E P M K A Y F T D R D G K
G H I F L L - - - - - - - - - - - - - - - - - -
AAAAGAGTAAGCGTCCTT------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E K P I I M G C Y G I G V S R I L A A L V E Q Y
- - - I I M G C Y G I G V S R I L A A - - - - -
---------CTGTATTTGATAAAGAATTACGGGAAGCTGTCTGTATGAACGAACTAC---------------
457458459460461462463464465466467468469470471472473474475476477478479480
H D D K G I K W P T P V A P F E L D I I L L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K D E E M K N V A E K L Y L E A E E K G I D V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F D D R E E S P G F K F A D A D L V G F P Y R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V V G K K V K E G K V E V Q S R H T G E K W D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570
E I E K A I D F V K E K I E E D K K
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Gemmata obscuriglobus/amino acid sequences/Gemmata_pro_aa
Bacteria/Gemmata obscuriglobus/nucleotide sequences/Gemmata_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A D V I T P R A R N Y S Q W Y L D I V K E A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A D N S D V R G C M V I K P T G Y A L W E K M
- - - - - - - - - - - - - - - - - - - L W E K M
---------------------------------------------------------TTCCGTCTCGCGCGT
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q R A L D R L F K D T G H V N A Y F P L F I P M
Q R A L D R L F K D T G H V N A Y F P L F I - -
GCCGTCCCAGTGGGCGTACACGAACTTCAGCGGCTCCGTGCCCGCTTCCGCAGCCTCCTCGCGCGC------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S F L A K E E Q M A E G F A K E C A V V T H Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K A E P G K P L H V D P A A E L E E P L I I R
- - - - - - - - - - - - - - - - - - - - - I I R
---------------------------------------------------------------GCCGAACTG
121122123124125126127128129130131132133134135136137138139140141142143144
P T S E T I I W N T Y K K W V Q S Y R D L P L L
P T S E T I I W - - - - - - - - - - - - - - L L
CTTCCCCTCTTTTCCGGGTACGTC------------------------------------------CCCGAT
145146147148149150151152153154155156157158159160161162163164165166167168
I N Q W A N V V R W E M R T R L F L R T A E F L
I N Q W A N V V R W - - - - - - - - - - A E F L
CTCCACGCGAACGGGCACCCCGCGGACCTC------------------------------GTCGAACAGCGT
169170171172173174175176177178179180181182183184185186187188189190191192
W Q E G H T A H A T A Q E A E A E T L Q M V R V
W Q E G H T A - - - - - - - - - - T L Q M V R V
GTCGATCTTCACGCTGATCGG------------------------------CGCACGCAGCTCGGTCGCGAG
193194195196197198199200201202203204205206207208209210211212213214215216
Y Q K F A E E W M A M P V L V G P K T D G Q K F
Y Q K F A E - - - - - - - - - - - - - - - - - -
CTTTTCCGCAGCGGCGAT------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P G A V Y T L C I E A M M Q D G K A L Q A G T S
- - - - - T L C I E A - - - - - - - - Q A G T S
---------------GGGGATTACGAGCCCGTT------------------------GCCGCCGATGAGCCG
241242243244245246247248249250251252253254255256257258259260261262263264
H F L G Q N F A K A F D V K F K D K E N K E E F
H F L - - - - - - - - - - - - - - - - - - - - -
CGTGCTCAC---------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A W A T S W G V S T R L I G G L I M T H S D D N
A W A T S W G V S T R L I G G - - - - - - - - -
TGCCTTCGCGAAATTCTGGCCCAAGAAGTGCGACGTTCCGGCCTG---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G L V I P P R L A A T H V V I V P L G K N D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R G P S I A A A E K L A T E L R A L P R D D F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G Y E P I S V K I D T L F D K Q P G F R Y A E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E V R G V P V R V E I G P K D I E K G A C A V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R R D V P G K E G K Q F G I P L T G A A E H I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K L L R D I Q A S L Y N R A K A F R D S R I V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A N T L D E F K A L F P A R E E A A E A G T E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L K F V Y A H W D G T R E T E E S V Q K E F A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
T I R C L P F D G P Q E A G T C I F T G K P S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513
R R V V F A R A Y
- - - - - - - - -
---------------------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_pro_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A E K A D A L K I T R R D E D Y S R W Y L D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V D R A K L A E D S G I R G C M I I R P E G F A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I W E K M Q Q T L D G M F K D T G H T N A Y F P
I W E K M Q Q T L D G M F K D T G H T N A Y F P
ATTTGGGAGAAAATGCAGCAAACCCTGGACGGAATGTTTAAAGACACCGGACACACGAATGCTTACTTTCCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V F I P V S Y F S K E A E H V S G F A K E C A V
V F I - - - - - - - - - - - - - - - - - - - - -
GTATTTATT---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V T H H R L Q L T E S G E I T V D P D A E L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P L V V R P T S E T I I W S A Y R N W I Q S Y R
- - V V R P T S E T I I W - - - - - - - - - - -
------GTTGTCAGACCGACTAGCGAAACTATTATTTGG---------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D L P I L L N Q W A N I C R W E L R T R P F L R
- - - I L L N Q W A N I C R W - - - - - - - - -
---------ATTCTGTTGAATCAATGGGCAAATATTTGTCGCTGG---------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T T E F L W Q E G H T A H A T A D E A E A E A R
- T E F L W Q E G H T A - - - - - - - - - - A R
---ACCGAATTTCTTTGGCAAGAAGGACATACAGCT------------------------------GCAAGG
193194195196197198199200201202203204205206207208209210211212213214215216
Q M L E I Y K T F V E Q Y L A I P V F A G R K T
Q M L E I Y K T F V E - - - - - - - - - - - - -
CAAATGTTAGAAATTTACAAAACTTTTGTCGAG---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E N E K F P G A V H T Y T I E T M T Q D K R A I
- - - - - - - - - - T Y T I E T - - - - - - - -
------------------------------ACTTATACAATCGAAACA------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q V G T S H N L G T T F S K A F D V K Y L S A E
Q V G T S H N L - - - - - - - - - - - - - - - -
CAAGTCGGTACGAGCCACAATTTA------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G T Q E Y P F A T S W G I T T R M I G T L I M V
- - - - - P F A T S W G I T T R M I G T - - - -
---------------CCATTTGCAACGAGTTGGGGCATTACAACTAGAATGATCGGTACT------------
289290291292293294295296297298299300301302303304305306307308309310311312
H S D D R G F V C P P R I A P L Q V I G V P I Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R K D A E K E Q V L A R F T E L Q E Q F K A T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A F S F K V D T R D N L S P G F K F N D W E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
G I P L R L E M G P R D L A N G T A V L V R R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T G E K I N V A Q T D L E S Q I K T L L E D I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I S L F K R A Q E F Q Q Q N L H F V E T Y A E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q Q Q I E E K A G F Y V A Y F D G N S D D E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I K E E T K A T G R C I P F D L Q Q G T G K C F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496
Y T G R Q T D R R V I F A R A Y
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_pro_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R Q S R T L I P T L R E V P T D A E A K S H Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L L R A G F I R Q N T S G V Y S Y M P L A N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V I H K I Q S I V R Q E M E K I N A V E M L M P
V I H K I Q S I V R Q E M E K I N A V E M L M P
GTCATTCATAAAATCCAGAGCATTGTCCGCGAAGAAATGGAGAAAATCAATGCCGTCGAAATGCTGATGCCG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L Q Q A E T W Q E S G R W Y T Y G P E L M R L
A L Q - - - - - - - - - - - - - - - - - - - - -
GCGCTCCAG---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K D R H G R E F A L G A T H E E V I T S I V R D
- - - - - - - - A L G A T H E E V I T - - - - -
------------------------GCCCTAGGCGCAACACACGAAGAGGTCATCACA---------------
121122123124125126127128129130131132133134135136137138139140141142143144
E V K S Y K R L P L T L Y Q I Q S K F R D E K R
- - - - - - - - - L T L Y Q I Q S K F R D - - -
---------------------------CTGACCCTTTACCAGATCCAATCGAAGTTCCGCGAT---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G L L R G R E F I M K D A Y S F H S S A E
- - - - - - - - R E F I M K D A Y S F - - - - -
------------------------CGGGAATTCATCATGAAGGATGCGTATTCCTTC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L D E T Y N D M Y Q A Y T N V F T R C G L N F
- - - - - Y N D M Y Q A Y T N V F T - - - - - -
---------------TACAATGATATGTATCAGGCGTATACGAATGTGTTTACG------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R P V I A D S G A M G G K D T H E F M A L S D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E D T I A Y S D Q S S Y A A N I E M A E V K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A G A G E K A E M K E L Q E V H T P S V K T I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E V A A F L G I S P S D C V K S M L M K A D G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F V L V L T R G D H E V N D I K V K N L L Q A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
T I E F A S A E E V A E I T G T E P G F V G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G L D S E I E I F A D F A V K A M A N A A A G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N K T D Y H Y Q N V N I S R D V H N V T F A D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R L I Q E G D P S P D G N G T I R F A K G I E V
- - - - - - - - - - - - - - - - R F A K G I E V
------------------------------------------------CGTTTTGCAAAAGGAATCGAAGTC
409410411412413414415416417418419420421422423424425426427428429430431432
G Q V F K L G T R Y S E A M D A T Y L D E N G R
G Q V F K L - - - - - - - - - - - - - - - - - -
GGACAAGTCTTTAAGCTC------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A Q P M L M G C Y G I G I S R T L S A I V E Q H
- - - M L M G C Y G I G I S R T L S A - - - - -
---------ATGCTGATGGGCTGCTATGGAATCGGGATTTCCCGGACGCTTTCGGCC---------------
457458459460461462463464465466467468469470471472473474475476477478479480
H D D K G L I W P L E V T P Y D L H I L A L N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K N D A Q V Q L A E K L Y E D F K A N G Y D V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
F D D R A E R A G V K F A D S D L I G L P I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
T V G K R A D E G V V E V K I R K T G E S F E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572
A A E E L L D F I E K Q V K S L S S H S
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_pro_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S D F I A S K E D D Y S K W Y L D I V Q K A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A D Y S P V K G C M V I M P Y G Y S I W S K I
- - - - - - - - - - - - - - - - - - - I W S K I
---------------------------------------------------------AATAATATTTTCACA
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q S I L D K K F K E T G H E N A Y F P M L I P Y
Q S I L D K K F K E T G H E N A Y F P M L I - -
ATTCAAACTGCCACACCAACAAGAAAGCACAAATCCAGAATAATCATTCACATAGGCTTTGAATGT------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S F L E R E K D H I D G F S P E F A I I K D A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G E S L A E P L V L R P T S E T I I W N M Y S K
- - - - - - - - V L R P T S E T I I W - - - - -
------------------------CTTAACCTTGCTTATAAGAGAATCAAGTGATAT---------------
121122123124125126127128129130131132133134135136137138139140141142143144
W I K S Y R D L P L K I N Q W A N V V R W E K R
- - - - - - - - - L K I N Q W A N V V R W - - -
---------------------------AACGGAATTTAAAAGGACATCATTTATCCCCACTTC---------
145146147148149150151152153154155156157158159160161162163164165166167168
T R P F L R T T E F L W Q E G H T A H A T E E E
- - - - - - - T E F L W Q E G H T A - - - - - -
---------------------AGATGAAAATCTAAATCCCGGAGAACTTCTAAC------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A L E E T L L I L D V Y K R F I E D Y L A I P V
- - - - T L L I L D V Y K R F I E - - - - - - -
------------TTTTTTTAAAGCATCCACAACACAATCAGAATAATCTAA---------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F C G K K S E K E K F A G A V S T Y S I E A L M
- - - - - - - - - - - - - - - - T Y S I E A - -
------------------------------------------------AGGCGGCAAAACTAAACC------
217218219220221222223224225226227228229230231232233234235236237238239240
Q D K K A L Q A A T S H Y L G L N F A K A F D V
- - - - - - Q A A T S H Y L - - - - - - - - - -
------------------CAAAGCACCAATCAATCTGGTAGA------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K F Q D K D G K M R H V F A S S W G V S T R L I
- - - - - - - - - - - V F A S S W G V S T R L I
---------------------------------AAATGCCTTTGCAAAATTTAAACCTAAATAATGGGATGT
265266267268269270271272273274275276277278279280281282283284285286287288
G A L I M V H S D E K G L V L P P R I A P I E I
G A - - - - - - - - - - - - - - - - - - - - - -
AGCGGC------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I V I P I F K K E D E I N K K I L D Y S D C V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
D A L K K A E F R V E I D K D V R S S P G F R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
S S A E F K G I P I R L E V G I N D V L L N S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T I S R R D K D R K F K Y Q I S L D S L I S K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K V E L D L M Q K D L F Q R A L N F R I L N T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E I F R S S K D S Y E T F K A Y V N D Y S G F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L S C W C G S L N C E N I I K N E T K A T I R C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
I P D D F K A R D L T G M T C I Y C S S K A K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488
F V L F A K S Y
- - - - - - - -
------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_pro_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H K K L P T R A E N F S E W Y N E I I K R A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A E N A A V R G C M T I R P Y G F A I W E K M
- - - - - - - - - - - - - - - - - - - I W E K M
---------------------------------------------------------ATATGGGAAAAAATG
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q A I L D K A F K A T G H E N A Y F P I F I P K
Q A I L D K A F K A T G H E N A Y F P I F I - -
CAAGCCATATTAGATAAAGCGTTTAAAGCAACAGGCCATGAGAATGCTTATTTTCCTATTTTCATA------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S Y L N R E A A H V E G F A K E C A V V T H Y R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K A T E D G Q Q V V V D P S A K L E E E L I V
- - - - - - - - - - - - - - - - - - - - - - I V
------------------------------------------------------------------ATTGTA
121122123124125126127128129130131132133134135136137138139140141142143144
R P T S E T I I W N S Y K N W I Q S Y R D L P L
R P T S E T I I W - - - - - - - - - - - - - - L
CGGCCCACCTCAGAAACCATTATTTGG------------------------------------------TTA
145146147148149150151152153154155156157158159160161162163164165166167168
L I N Q W C N V V R W E M R T R L F L R T A E F
L I N Q W C N V V R W - - - - - - - - - - A E F
CTAATCAACCAGTGGTGCAATGTGGTACGCTGG------------------------------GCTGAGTTT
169170171172173174175176177178179180181182183184185186187188189190191192
L W Q E G H T A H A T Q A E A E Q E A L Q M L N
L W Q E G H T A - - - - - - - - - - A L Q M L N
TTATGGCAAGAGGGGCACACAGCC------------------------------GCATTACAGATGTTAAAT
193194195196197198199200201202203204205206207208209210211212213214215216
I Y A D F G K D Y L A I P F L K G I K T E H E R
I Y A D F G K - - - - - - - - - - - - - - - - -
ATCTATGCTGATTTTGGAAAA---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F A G A E E T Y T I E A L M Q D G K A L Q A G T
- - - - - - T Y T I E A - - - - - - - - Q A G T
------------------ACGTATACTATAGAGGCT------------------------CAGGCAGGCACT
241242243244245246247248249250251252253254255256257258259260261262263264
S H F L G Q R F A K A F E V T F T N Q A G Q L D
S H F L - - - - - - - - - - - - - - - - - - - -
TCTCATTTTTTA------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y V W G T S W G L T T R L I G A L V M T H S D D
- V W G T S W G L T T R L I G A - - - - - - - -
---GTATGGGGCACTTCTTGGGGCCTTACTACTCGTTTGATAGGTGCC------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K G L V L P P R V A P I Q I V I I P I Y R T Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E K E A I Q Q Q A Q H I Q Q Q L I A H N I S A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L D G R D E H K P G W K F A E Y E L K G V P I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
M A I G P N D L A N N T V E L T R R D T S E K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T V P T D N I I V V V K S M L D S I H D N L Y Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R A Y E F R E Q N T Y Q V N S Y E E F K T A I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q K R G F I L A H W D G T K E T E R Q I H A E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K A T I R C I P L E V N T E P G V C I Y T G K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491
S K Q R V V F G Q A Y
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_pro_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T K D G G K K D N Q G Q D K K A Q Q Y G V T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q S V D F N D W Y N E V V K K A D L A D N S P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A G A M V V R P Y G S A L W E N I Q R W L D D R
- - - - - - - - - - - - L W E N I Q R W L D D R
------------------------------------CTGTGGGAAAACATTCAGCGCTGGCTCGACGACCGC
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F K A S G H E S L I F P T L I P M N F I M K E A
F K A S G H E S L I F P T L I - - - - - - - - -
TTCAAGGCGAGCGGGCACGAATCGCTGATCTTCCCGACCCTCATT---------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D H V E G F A P E L F T V N K I G T E E L A E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y V M R P T S E T I I G H M W S G W L N S Y R D
- V M R P T S E T I I G - - - - - - - - - - - -
---GTGATGCGCCCGACCTCCGAGACGATCATCGGG------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L P F L H Y Q W G S V F R A E L R T K A F L R T
- - F L H Y Q W G S V F R A - - - - - - - - - -
------TTCCTGCACTACCAGTGGGGCAGCGTGTTTCGCGCC------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S E F F W H E G H T A H A D E A E A R A E V R Q
S E F F W H E G H T A - - - - - - - - - - V R Q
TCCGAGTTTTTCTGGCACGAGGGCCACACCGCC------------------------------GTGCGCCAG
193194195196197198199200201202203204205206207208209210211212213214215216
Q L D L Y H E F C R D V L A L P V V R G E K T A
Q L D L Y H E F C R - - - - - - - - - - - - - -
CAACTCGACCTGTACCACGAGTTCTGCCGC------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S E R F A G A V A T Y S I E G M M R D G K A L Q
- - - - - - - - - T Y S I E G - - - - - - - - Q
---------------------------ACCTACTCCATCGAGGGC------------------------CAA
241242243244245246247248249250251252253254255256257258259260261262263264
S G T S H Y L G Q N F S R A F D V K Y Q T R E Q
S G T S H Y L - - - - - - - - - - - - - - - - -
TCGGGCACCTCGCACTACCTC---------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K E E F A H T T S W A I S S R I I G A I I M T H
- - - - A H T T S W A I S S R I I G A - - - - -
------------GCGCACACGACCTCCTGGGCCATCTCCAGCCGCATCATCGGGGCC---------------
289290291292293294295296297298299300301302303304305306307308309310311312
G D D S G L M M P P R I A P I Q V V V I P V G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K D N F D Q M V Q E G E K L A A E L R A Q G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K V D G R D G V T N G F K Y N D W E L K G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V R I E L G P R D L E S G V L V V K N R H S E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
K E T L P R A E A V S G M S A R L D T I H D F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
M K R A T D F L L A N T A E V D S Y D A F Q R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I E A G H W V R A Y H C G E P A C E K S I K E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
T K A T A R N V P F D D A E F F A E R G E G Q C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499
V K C G Q P S A Y G K R V L F G R Q Y
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_pro_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K Q S K V F I P T M R D V P S E A E A Q S H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L L K A G L I K Q S T S G I Y S Y L P L A T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L N N I T A I V R Q E M E R I D S V E I L M P
V L N N I T A I V R Q E M E R I D S V E I L M P
GTGTTAAATAATATTACTGCAATTGTGCGACAAGAAATGGAACGTATCGATTCTGTTGAAATTTTAATGCCA
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L Q Q A E L W E E S G R W G A Y G P E L M R L
A L Q - - - - - - - - - - - - - - - - - - - - -
GCGTTACAA---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q D R H G R Q F A L G P T H E E L V T S I V R N
- - - - - - - - A L G P T H E E L V T - - - - -
------------------------GCATTAGGTCCAACACATGAAGAATTAGTTACA---------------
121122123124125126127128129130131132133134135136137138139140141142143144
E L K S Y K Q L P M T L F Q I Q S K F R D E K R
- - - - - - - - - M T L F Q I Q S K F R D - - -
---------------------------ATGACATTATTCCAAATTCAATCTAAATTCCGTGAT---------
145146147148149150151152153154155156157158159160161162163164165166167168
P R F G L L R G R E F I M K D A Y S F H A D E A
- - - - - - - - R E F I M K D A Y S F - - - - -
------------------------CGTGAATTTATTATGAAAGATGCGTATTCATTC---------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L D Q T Y Q D M Y Q A Y S R I F E R V G I N A
- - - - - Y Q D M Y Q A Y S R I F E - - - - - -
---------------TATCAAGATATGTATCAAGCGTATAGCCGTATTTTTGAG------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R P V V A D S G A I G G S H T H E F M A L S A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G E D T I V Y S K E S D Y A A N I E K A E V V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E P N H K H T T V Q P I E K I E T P N V K T A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L A D F L G R P V D E I V K T M I F K V D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Y I M V L V R G H H E I N D I K L K S Y F G T D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
N I E L A T Q D E I V N L V G A N P G S L G P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I D K E I K I Y A D N F V Q D L N N L V V G A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E D G Y H L I N V N V G R D F N V D E Y G D F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F I L E G E K L S D G S G V A H F A E G I E V G
- - - - - - - - - - - - - - - H F A E G I E V G
---------------------------------------------CATTTTGCTGAAGGAATTGAAGTTGGT
409410411412413414415416417418419420421422423424425426427428429430431432
Q V F K L G T K Y S E S M N A T F L D N Q G K A
Q V F K L - - - - - - - - - - - - - - - - - - -
CAAGTATTCAAATTG---------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q P L I M G C Y G I G I S R T L S A I V E Q N H
- - L I M G C Y G I G I S R T L S A - - - - - -
------TTAATTATGGGTTGTTACGGTATTGGAATTTCTAGAACGCTAAGTGCG------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D D N G I V W P K S V T P F D L H L I S I N P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K D D Q R E L A D A L Y A E F N T K F D V L Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D R Q E R A G V K F N D A D L I G L P L R I V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
G K R A S E G I V E V K E R L T G D S E E V H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567
D D L M T V I T N K Y D N L K
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_pro_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R G G R L L G P P H A C F S L L S N S V S C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S S S R A S H R S I T R H L G V R H H L P S S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P R T P S Y S T S P V T P V T P T R G Y S G T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I H T Q N K S P P A S S L P H M S I E D C R G F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H E V K A L L Q E L G L D I P I V H H D E K A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E E V L D L L H K M G I H A A G T K T L F L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S K K G E L V M A T A F K S T P T D L K F I Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V T N A K D L R F A S S E V L Q E C L A V V Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C V T P F A L I N N I E K R P I T L L I D R S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E A S T L P L A F C L C R N D Y T A V I T F E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L K K Y L E K L G H A Y K L V D F G A A S A D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A V T G G A A A P A P K P K K A P A D A A A A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A A P A S A Q S G E T K L G I A A K R E E N F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A W Y I D V I T K A E M I E Y Y D V S G C Y I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R P W A Y Y V W K C V Q R F L G G K I E K L G V
- - - - - - V W K C V Q R F L G G K I E K L G V
------------------GTGTGGAAGTGCGTGCAGCGCTTCCTTGGTGGGAAGATCGAGAAGCTTGGCGTG
361362363364365366367368369370371372373374375376377378379380381382383384
E D C Y F P M F V S R N C L E R E K D H I E G F
E D C Y F P M F V - - - - - - - - - - - - - - -
GAGGACTGCTACTTCCCGATGTTCGTG---------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
A P E V A W V T R A G D T E L E Q P V A V R P T
- - - - - - - - - - - - - - - - - - - A V R P T
---------------------------------------------------------GCCGTGCGGCCGACG
409410411412413414415416417418419420421422423424425426427428429430431432
S E T V M Y P Y Y A K W I R S H R D L P V R L N
S E T V M Y - - - - - - - - - - - - - - V R L N
AGCGAGACGGTGATGTAC------------------------------------------GTGCGGCTGAAC
433434435436437438439440441442443444445446447448449450451452453454455456
M W N N V I R W E F S H P T P F I R T R E F L W
M W N N V I R W - - - - - - - - - - - R E F L W
ATGTGGAACAACGTGATCCGGTGG---------------------------------CGCGAGTTCCTGTGG
457458459460461462463464465466467468469470471472473474475476477478479480
Q E G H C A W A K A E E C A K E V L D I L E C Y
Q E G H C A - - - - - - - - - - V L D I L E C Y
CAGGAGGGGCACTGTGCG------------------------------GTGCTGGACATCCTGGAGTGCTAT
481482483484485486487488489490491492493494495496497498499500501502503504
A S V Y E Q L L A V P V V R G R K T E K E K F A
A S V Y E - - - - - - - - - - - - - - - - - - -
GCATCGGTGTACGAG---------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G G D Y T T T V E T F I E A V G R G C Q G A T S
- - - - T T T V E T - - - - - - - - - Q G A T S
------------ACGACGACGGTGGAGACG---------------------------CAGGGCGCGACGAGC
529530531532533534535536537538539540541542543544545546547548549550551552
H N L G Q N F G K M F D I R F Q D P E N N E Q T
H N L - - - - - - - - - - - - - - - - - - - - -
CACAACCTG---------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L I P W Q N S W G L S T R V I G V M I M V H G D
- - P W Q N S W G L S T R V I G V - - - - - - -
------CCGTGGCAGAACAGCTGGGGGCTGTCGACGCGCGTGATCGGCGTG---------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N R G M V M P P R V A S T Q V I I I P V G I T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D T T E E A R Q E L L A S C R R L E S E L C E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G V R A K C D L R D N Y S P G W R F N H W E V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G V P L R V E L G P R E L A E R S L A V A V R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
S G A R H S V V W D A Q T P T A V A A L L E D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
H A Q M Y A R A K E T M E T H R V R V T E W A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
F V P T L N R K C L I L A P W C G A M E C E D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V K K D S A E E S K A A Q A Q E T R E D A R A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788789790791792
S M G A K T L C I P F E Q P E D P A E G H G C I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
793794795796797798799800801802803804805806807808809810
C K G C T K P A T T W V L F G R S Y
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_pro_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
L F K K K K P S K N K F I K S T K R N N K Q L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V I E F K I K M S V D E K L Y S E V L D Q L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L S I N Y S K F D H D A T P N M E S M V E V L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E Q A E K H N T D F A K N L L I K S K G N E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F F V L A H H E T D T K M K N L G Q I F G V S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N K L R L A D E D V L N D T L K V K R G C L T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L S L I F E K S G G I Q V Y F D E C L K D K K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F V H P L T N T E S F S I H I N D I V K F A E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
C G K K V K W F S M D N L E E Q K P A G K P E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S K E N E S L L G I T A D K I T S F A D W Y S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V I V K S E M I E Y Y D I S G C Y I L R P W S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F I W E T I Q S V F D Q K I K Q H D V Q N A Y F
- I W E T I Q S V F D Q K I K Q H D V Q N A Y F
---ATTTGGGAAACAATTCAAAGCGTTTTCGATCAGAAAATCAAACAACATGATGTACAAAATGCCTATTTC
289290291292293294295296297298299300301302303304305306307308309310311312
P I F V T Q K K L E T E K D H V E G F S P E V A
P I F V - - - - - - - - - - - - - - - - - - - -
CCCATTTTTGTA------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
W V T K S G K S D L A E P I A I R P T S E T I M
- - - - - - - - - - - - - - A I R P T S E T I M
------------------------------------------GCTATCCGTCCAACATCTGAAACAATCATG
337338339340341342343344345346347348349350351352353354355356357358359360
Y P Y F A K W I R S H R D L P L K I N Q W T S I
Y - - - - - - - - - - - - - - L K I N Q W T S I
TAT------------------------------------------CTTAAGATTAATCAATGGACTTCCATT
361362363364365366367368369370371372373374375376377378379380381382383384
V R W E F K H P T P F I R T R E F L W Q E G H T
V R W - - - - - - - - - - - R E F L W Q E G H T
GTAAGATGG---------------------------------CGTGAATTTTTATGGCAAGAAGGACATACA
385386387388389390391392393394395396397398399400401402403404405406407408
A H S T R K E A L E M V D I I L N E Y A S I Y E
A - - - - - - - - - - V D I I L N E Y A S I Y E
GCC------------------------------GTTGACATCATTTTAAATGAATATGCATCTATTTATGAA
409410411412413414415416417418419420421422423424425426427428429430431432
D L L A T P V V K G T K S E N E K F P G G D I T
- - - - - - - - - - - - - - - - - - - - - - - T
---------------------------------------------------------------------ACT
433434435436437438439440441442443444445446447448449450451452453454455456
K S I E G F I P E I G R A V Q A A T S H L L G Q
K S I E G - - - - - - - - - Q A A T S H L L - -
AAATCAATTGAAGGA---------------------------CAGGCTGCAACTTCTCATTTACTT------
457458459460461462463464465466467468469470471472473474475476477478479480
N F S K M F G V E F E D E K G N K E Y A H Q T S
- - - - - - - - - - - - - - - - - - - A H Q T S
---------------------------------------------------------GCACATCAAACTTCT
481482483484485486487488489490491492493494495496497498499500501502503504
W G L T T R A I G V M I M T H G D N K G L V L P
W G L T T R A I G V - - - - - - - - - - - - - -
TGGGGCTTAACTACAAGAGCTATTGGTGTT------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P K V A P V Q V I I I P I I F K T V I T E E Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K I C N E V E C I L K K A G V R V K I D D R S N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y T P G W K Y N H W E V K G V C L R F E V G P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D I E K R S V R V V V R D N M E K M D I P I S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L E S K I P K L L E E F Q N R L L F K A K Q R Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
N E S I I R V D T F D K V M D T L N Q K K M V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
A P W C E D V S C E E E I K K E T A R L S L D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
E D N Q S M T G A M K S L C I P N D Q I F K I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719
E G K T K C F F C D K L A K K F T L F G R S Y
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Eukaryotes/Coccomyxa subellipsoidea/amino acid sequences/Csubellipsoidea_pro_aa
Eukaryotes/Coccomyxa subellipsoidea/nucleotide sequences/Csubellipsoidea_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L P S N R W Y L D V V R D A E L A D Y G P V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G T M V I R P Y G Y A I W E G I Q S Y L D S R F
- - - - - - - - - - - I W E G I Q S Y L D S R F
---------------------------------ATATGGGAAGGCATACAGTCGTACCTGGACTCGCGGTTC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K E L G V Q N A Y F P Q L I P L S F L Q K E A D
K E L G V Q N A Y F P Q L I - - - - - - - - - -
AAGGAGCTGGGCGTGCAGAACGCGTACTTCCCGCAGCTCATC------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H V E G F A P E L A L V T K G G G K D L E E P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V V R P T S E T M V N H M L A Q W I Q S Y R D L
V V R P T S E T M V N - - - - - - - - - - - - -
GTGGTACGGCCGACGTCTGAGACGATGGTGAAC---------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P M L L N Q W A N V H R W E L R T R P F I R T L
- M L L N Q W A N V H R W - - - - - - - - - - L
---ATGCTGCTCAACCAGTGGGCCAACGTGCACCGCTGG------------------------------CTC
145146147148149150151152153154155156157158159160161162163164165166167168
E F L W Q E G H T A H A T A E E A K A M A Q Q M
E F L W Q E G H T A - - - - - - - - - - A Q Q M
GAATTCCTCTGGCAGGAGGGCCACACCGCC------------------------------GCCCAGCAGATG
169170171172173174175176177178179180181182183184185186187188189190191192
V E V Y A D F A I N C A A M P V I P G R K S R I
V E V Y A D F A I - - - - - - - - - - - - - - -
GTGGAGGTTTATGCTGACTTTGCAATC---------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S F A G A N V T L T I E A M M G D R R A L Q A
- - - - - - - - T L T I E A - - - - - - - - Q A
------------------------ACCCTCACCATTGAGGCT------------------------CAGGCG
217218219220221222223224225226227228229230231232233234235236237238239240
G T S H D L G D N F A R A F G T Q F L D E S G E
G T S H D L - - - - - - - - - - - - - - - - - -
GGCACGAGCCATGATCTT------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L V H P Q Q T S W G A S T R L I G G I I M T H G
- - - P Q Q T S W G A S T R L I G G - - - - - -
---------CCGCAGCAGACAAGCTGGGGTGCCAGCACACGCCTCATTGGCGGC------------------
265266267268269270271272273274275276277278279280281282283284285286287288
D D M G L R L P P R L A P I Q V V I V P I L K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N T D T E A V L A A A D A L A E A A K A A G L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A K V D A G T E K T P G F K F S Y W E M K G V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V R I E V G P R D V A Q G T C V A A R R D R P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K E G K Q F G I P L E P A G F V A S M R Q L L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D V H D G L L A E A T A F R D A N I V D V E S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D N L K A A I E A G K W A R G R W A G S D E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K R I K E E T T A T L R C I P F D Q P G G S G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474
C F L T G A D A A E V A I F A K A Y
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_pro_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V S H L M L V T L R D D P A E A E V I S H K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L L L R A G Y I R R V T I G I Y A Y L P L L W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V L K K I S S C V R E E M T S A G A I E L L M P
V L K K I S S C V R E E M T S A G A I E L L M P
TATTTGCCAAGGTATACCAATTAAATCAGCATCTTTGAATTTTACGCCTGCTCTATCTTGACGGTCATCAAT
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q L Q P A D I W Q L S K R W A G Y T Q G E G I M
Q L Q - - - - - - - - - - - - - - - - - - - - -
CAAGACATC---------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F N L K D R Q G R E L A L G P T H E E V V T N L
- - - - - - - - - - - A L G P T H E E V V T - -
---------------------------------TGCTATTGATAAAGGCCAACAAATTCCTTTTTG------
121122123124125126127128129130131132133134135136137138139140141142143144
V D N L I K S Y R Q L P C T L Y Q I Q T K F R D
- - - - - - - - - - - - C T L Y Q I Q T K F R D
------------------------------------ACCAATTCCATAGCAACCCATCCAAAACGGTTCTTG
145146147148149150151152153154155156157158159160161162163164165166167168
E I R P R F G L M R S R E F V M K D A Y S F H S
- - - - - - - - - - - R E F V M K D A Y S F - -
---------------------------------GGCTATTGAATACTTATGTCCTAAACGAAAAAT------
169170171172173174175176177178179180181182183184185186187188189190191192
S E I D L K V S Y D R M D L G Y R N I F R R C G
- - - - - - - - Y D R M D L G Y R N I F R - - -
------------------------TAATGTATAGATAGGATTATGAATACATTGGTCATTAGC---------
193194195196197198199200201202203204205206207208209210211212213214215216
L N V V A V E A D S G S I G G A A S Q E F M V T
- - - - - - - - - - - - - - - - - S Q E F M V -
---------------------------------------------------AATAAGATGCTTGTTATC---
217218219220221222223224225226227228229230231232233234235236237238239240
A E A G E D L I L I S E D K S Y A A N Q E R A I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
S L P K I A F I S E N R G C Q Y L S T P K Q T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I D Q L C Q A H G L H S S Q I V K V L L M L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F S N C T P I P I L V S L R G D Q N L N E V K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
I S A V K S H V S S K V G T L L E I T P I T P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G A I N Q G V N N I P F G Y L G P Q L D D K V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L G A K D W Q K R F L R F V D P T A A A L T Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V C G A N I D N K H L I G A S W G D L F I L P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Q V D L R A A Q A N D Q C I H N P I Y T L T E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R G I E V G H I F R L G H K Y S I A L N A N Y T
- - - E V G H I F R L - - - - - - - - - - - - -
---------CTCGCTGGAATGAAATGAATAAGC---------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N E I G N Q E P F W M G C Y G I G I S R L S Q A
- - - - - - - - F W M G C Y G I G I S R L S Q A
------------------------TTTTGTCTGTATTTGATACAAGGTACAAGGAAGCTGACGATAAGATTT
481482483484485486487488489490491492493494495496497498499500501502503504
A V E Q H H D Q K G I C W P L S I A P F E V I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V I V S I Q D E I Q R T L G E A L Y S I M K A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R V D V L I D D R Q D R A G V K F K D A D L I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I P W Q I V I G R G A I N N Q I E L V E R I T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R S E Q L D A G Y L V K Y F L Q Y L E R T H N I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604
F L G D
- - - -
------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_pro_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_pro_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M A K Q K F G L T V N K A E N F S S W Y T Q V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V K G E F L D Y Y D V K G C Y I L R P N G Y F I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------ATC
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W N E I R K W F T N E I E K L G V E E C L F P M
W N E I R K W F T N E I E K L G V E E C L F P M
TGGAATGAAATAAGAAAGTGGTTTACAAATGAAATAGAAAAGTTGGGTGTAGAGGAATGCTTATTTCCTATG
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L I P K T F L E K E E S H I S D F S P E V A W I
L I - - - - - - - - - - - - - - - - - - - - - -
TTGATA------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T K C G N E V L H E P V A I R P T S E T V M Y P
- - - - - - - - - - - - A I R P T S E T V M Y -
------------------------------------GCAATAAGACCCACGTCTGAAACAGTTATGTAT---
121122123124125126127128129130131132133134135136137138139140141142143144
S F A R W I S S H R D L P L K V N Q W C N I L R
- - - - - - - - - - - - - L K V N Q W C N I L R
---------------------------------------CTTAAGGTCAATCAGTGGTGCAATATTTTACGG
145146147148149150151152153154155156157158159160161162163164165166167168
W E L R G T T P L I R S K E I L W Q E G H T A H
W - - - - - - - - - - - K E I L W Q E G H T A -
TGG---------------------------------AAAGAAATTCTCTGGCAAGAAGGACACACAGCT---
169170171172173174175176177178179180181182183184185186187188189190191192
I D K E E A D K E V L D I L D L Y Y R M Y K E L
- - - - - - - - - V L D I L D L Y Y R M Y K - -
---------------------------GTTTTAGATATATTAGATTTGTACTACAGAATGTACAAA------
193194195196197198199200201202203204205206207208209210211212213214215216
L A V P V I K G L K T E T E K F A G S D Y S T T
- - - - - - - - - - - - - - - - - - - - - S T T
---------------------------------------------------------------AGTACAACT
217218219220221222223224225226227228229230231232233234235236237238239240
V E G F I P Q A G K G I Q A A T S H H L G Q N F
V E G - - - - - - - - - Q A A T S H H L - - - -
GTTGAAGGG---------------------------CAAGCTGCTACATCGCACCATCTT------------
241242243244245246247248249250251252253254255256257258259260261262263264
S K M F D V K V Q V D D G V S D F V Y Q N S W G
- - - - - - - - - - - - - - - - - V Y Q N S W G
---------------------------------------------------GTTTATCAAAATTCATGGGGA
265266267268269270271272273274275276277278279280281282283284285286287288
M T T R S L G I A V M I H S D D K G L V L P P K
M T T R S L G I - - - - - - - - - - - - - - - -
ATGACTACCAGATCGTTAGGAATT------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
V A K I Q V V I I P C G L S V K T S T E D K N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L L K V I N R I K N Q L L F S K I R V H I D D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
D N V T V G Y K F N H W E I R G V P I R I E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L K D L E K N E M C I Y K R N T G T K N Q Y T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D D N V T E K I Q L L I N D I H E E M Y N T A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K E Q E S K I L Y I N N I F D F V K K L D E N C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I L M T P W C E S S Q C E E K I K T M S T K F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D E K I L I A G A K S L C I P F E S R K I E H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499
T C I I C K S A C K R Y T L F G R S Y
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_ser_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T W S L L R Y L R E N P E I L R E S L R K R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M D P S L V D K L R K L D E E W R R L K R A V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E I R H R H N I I T R S I A K T K D P E E R K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L I E E A R K L L K E R E Q L E E K L K R V E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E R E K L L L S L P N I V H E S V P V G D S D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y N V P I R F W G R P K V Y R G F L E A F R E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T E K W G F K V D Y E V I D W K P I G H A D M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E H V L R L G D T M K A A E V A G S R F Y Y L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D D L V W L D F A L L M Y A I D H L T S K G Y K
- - - - - L D F A L L M Y A I D H L T S K G Y K
---------------CTAGACTTCGCGCTATTAATGTACGCTATCGATCATCTGACATCAAAGGGGTATAAG
217218219220221222223224225226227228229230231232233234235236237238239240
L V L P P Y M I R H K I L M G V I D M D T F E D
L V L P P Y M I - - - - - - - - - - - - - - - -
CTAGTACTACCACCATACATGATA------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A I Y K I E G E D L Y L I A T A E H P L A G L Y
- - - - - - - - - - Y L I A T A E H P L A - - -
------------------------------TACCTGATCGCAACAGCCGAGCATCCTTTGGCA---------
265266267268269270271272273274275276277278279280281282283284285286287288
Y N E E I M E D E L P L K L V G V S P C F R K E
- - - - - - - - - - - L K L V G V S P C F R K -
---------------------------------CTAAAGCTGGTGGGCGTCAGCCCTTGTTTCCGCAAA---
289290291292293294295296297298299300301302303304305306307308309310311312
A G A G N R D L K G I F R V H Q F H K V E Q Y I
- - - - - - - - - - - - - - H Q F H K V E Q Y I
------------------------------------------CACCAATTCCACAAGGTAGAGCAGTACATC
313314315316317318319320321322323324325326327328329330331332333334335336
Y A K P E E S W D L L E E L I R N A E E L F Q G
Y - - - - - - - - - L E E L I R N A E E L F Q -
TAC---------------------------CTAGAGGAGCTTATACGTAACGCCGAGGAGCTATTCCAG---
337338339340341342343344345346347348349350351352353354355356357358359360
L G L P Y R V V N V A S G E L G A P A A K K Y D
- - - - - - - - - - - - - - - - - - - - - K Y D
---------------------------------------------------------------AAATACGAC
361362363364365366367368369370371372373374375376377378379380381382383384
L E V W M P A Q G R Y R E M V S A S N T T D W Q
L E V - - - - - - - - - E M V S A S N T - - - -
CTAGAGGTA---------------------------GAAATGGTTAGCGCTAGCAATACT------------
385386387388389390391392393394395396397398399400401402403404405406407408
S Y R L N I R L V R R K G M V R E Y V H T L N S
- - - - - - - - - - - - - - - - - - V H T L N S
------------------------------------------------------GTACATACTCTTAACTCT
409410411412413414415416417418419420421422423424425426427428429430431432
T A I A S T R A I T A I L E N F Q E P D G T V V
T A . A S T R A I T A - - - - - - - - - - - - -
ACAGCT---GCCTCCACAAGAGCCATTACGGCT---------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I P K V L R K Y L E P F T K A P K D A I H P V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460
K E K E
- - - -
------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_ser_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D V K L L R S N R E L F E K N C E Y R G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A I I D Q F F K L D E E W R S V N R E L N G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R A E K N R M T R A I A E S L K R G K I V S N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K D R V E L I N E K I V S L E K K I R E I E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D R V L W T I P N L I H E S V P I C F G D E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N K I V R Y V G H A K V Y R D D E E E F L K G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G G N G D Y E V I D E R P K S H V D L G Q E L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I I D L E S A A K I S G A R F Y F I K N R L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L E M A L E N Y A V D F L S Q R G F T V V E P P
L E M A L E N Y A V D F L S Q R G F T V V E P P
CGTTGCTATTAAATAAAGGTCTTCATCTTCGATTTTATAAAGCGTATCCTTGAACGTTTCGAGGTCTGTTGC
217218219220221222223224225226227228229230231232233234235236237238239240
Y M L N L E S M R G A T D L E T F K D T L Y K I
Y M L - - - - - - - - - - - - - - - - - - - - -
ACCCCTCAT---------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E D E D L Y L I A T S E H S I A S M L S N E F L
- - - - - Y L I A T S E H S I A - - - - - - - -
---------------GAGTGCCATTTCCAGCTTCAACAACCTATTTTT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E E K E L P I R V A G V S A C F R R E A G A H G
- - - - - - I R V A G V S A C F R R - - - - - -
------------------TAAATCAATTATTCCGAGCTCCTGGCCTAAATCTAC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D T K G I F R V H Q F N K I E Q F I F C K P E
- - - - - - - - - H Q F N K I E Q F I F - - - -
---------------------------TCCTGATCCTTTGAGAAACTCCTCTTCATCATC------------
313314315316317318319320321322323324325326327328329330331332333334335336
D S W D Y L E E I L S N A E E I Y R S L G I P Y
- - - - - L E E I L S N A E E I Y R - - - - - -
---------------CCTAACTATTTTATTATTTTCATCACCAAAGCATATAGG------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V V N V C S G E L G R L A A K K Y D I E A W F
- - - - - - - - - - - - - - - - K Y D I E A - -
------------------------------------------------GATCTTTTTTTCCAAAGA------
361362363364365366367368369370371372373374375376377378379380381382383384
P A Q G K F R E I V S A S N D T D Y Q A R S L N
- - - - - - - E I V S A S N D - - - - - - - - -
---------------------TCGATCTTTCTCATTACTTACAAT---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I K Y R K S G G N E F V H T L N S T A I A T T R
- - - - - - - - - - - V H T L N S T A . A T T R
---------------------------------ACCATTCAACTCCCTGTTTACAGA---CCATTCTTCATC
409410411412413414415416417418419420421422423424425426427428429430431432
I L V A I M E N F Q E D G R I R I P D V L V P Y
I L V A - - - - - - - - - - - - - - - - - - - -
CAGCTTGAAAAA------------------------------------------------------------
433434435436437438439440441
T G F Q Y I D K E
- - - - - - - - -
---------------------------
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_ser_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S W S I L E L I R N N P E A L K E N L K K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I D T S T V D K A V E L D K K W R Q T L Q E V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L R H E H N L I S S Q I P K A P K E Q K S E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I N K A K E L L K T L E D K E K E L Q K I E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E S L L L S L P N L V H D S V P I G P D E S Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S L P I R F W G K F K V Y K D D V N E F L K Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N G H K V D Y E I I S W K P V G H A D M L E S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L R L G D T K K A G E V A A S R F Y Y L F N D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V W L D I A L L L Y A I D T I T S R G Y T L V L
- - L D I A L L L Y A I D T I T S R G Y T L V L
------TTAGATATAGCCTTATTACTTTATGCTATTGATACGATAACTTCAAGGGGATATACACTTGTTTTA
217218219220221222223224225226227228229230231232233234235236237238239240
P P Y M L R G E V I K S V I D L D T F K D A I Y
P P Y M L - - - - - - - - - - - - - - - - - - -
CCACCTTACATGCTT---------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I E G E D L Y L I A T A E H S I A A L Y Y K E
- - - - - - - Y L I A T A E H S I A - - - - - -
---------------------TATTTAATAGCCACAGCCGAACACTCCATAGCA------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E I P R E E L P L K L V G V S P A F R K E A G A
- - - - - - - - L K L V G V S P A F R K - - - -
------------------------CTCAAGTTAGTTGGTGTGAGTCCTGCATTCAGGAAA------------
289290291292293294295296297298299300301302303304305306307308309310311312
A N K D L K G I F R V H Q F H K V E Q F I F S S
- - - - - - - - - - - H Q F H K V E Q F I F - -
---------------------------------CATCAATTTCATAAGGTTGAGCAATTTATCTTC------
313314315316317318319320321322323324325326327328329330331332333334335336
P E D S W K Y H E E M I E N A E E I F R G L G L
- - - - - - - H E E M I E N A E E I F R - - - -
---------------------CATGAAGAAATGATTGAAAACGCAGAAGAGATATTCCGA------------
337338339340341342343344345346347348349350351352353354355356357358359360
P Y R V I N I A S G D L G A P A A K K Y D L E V
- - - - - - - - - - - - - - - - - - K Y D L E V
------------------------------------------------------AAATACGATCTTGAGGTG
361362363364365366367368369370371372373374375376377378379380381382383384
W M P A Q A K F R E M V S C S N C L D W Q A Y R
- - - - - - - - - E M V S C S N C - - - - - - -
---------------------------GAAATGGTTAGTTGTAGTAATTGT---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
M R I R Y V E K N N K K G Y L H T L N S T A I A
- - - - - - - - - - - - - - L H T L N S T A . A
------------------------------------------CTGCATACTTTAAACAGTACAGCA---GCT
409410411412413414415416417418419420421422423424425426427428429430431432
S T R A I T A I L E N Y Q K E D G V V E V P K M
S T R A I T A - - - - - - - - - - - - - - - - -
AGCACCAGGGCTATAACAGCT---------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
L R K Y L E T F S S A P K E Y I Y P K K K P N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458
T S
- -
------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_ser_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E L K F S A E V E L T L S R E V D P A E I E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T V E E F V K E A N E D L L Q R G V P T G K E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A K I E S Y R V L E D T I E M E I T G T R Y L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P H E A A M R V R K R L A E R L G R K H R V G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D L K I P R Y E V V L R F D R E V T R D D V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y V P V A D D V V V E D G T V R L T F Q D V D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E M L R R H V I D R V I R L V A W A V E E R S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L V E R V T K V E P G T V V D E S G P R E I R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D G D V T E E A R R R G W V K E F P G R G Q W I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y T P P M A A L F E V L R D F L L E R V T R K L
- - - - - - - L F E V L R D F L L E R . T R K L
---------------------CTGTTCGAAGTCCTCCGTGACTTCCTTCTGGAGCGT---ACGCGTAAGTTG
241242243244245246247248249250251252253254255256257258259260261262263264
G F E P A L F P K L I P L E T M F R M R Y L H G
G F E P A L F P K L I - - - - - - - - - - - - -
GGCTTCGAGCCCGCCCTGTTCCCGAAGCTAATT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L P D G M Y Y V C P P K R D P E L F D D F K R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
L Y V W G E L N E R T L G S L K E K L R D P G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
V L A P A Q C E P F Y E L L R D E V V D P E R L
V L A P A Q C E P F Y - - - - - - - - - - - - -
GTTCTGGCACCGGCCCAGTGTGAGCCGTTCTAC---------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P I K L Y D C S G W T Y R W E G G A A K G L E R
- I K L Y D C S . W T Y R W - - - - - - - - - -
---ATCAAGCTCTACGACTGCAGT---TGGACGTACCGGTGG------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V N E F Q R I E H V W I A E P E E A E R I R E E
- N E F Q R I E H V W I - - - - - - - - - R E E
---AACGAGTTCCAGCGGATCGAGCACGTGTGGATC---------------------------CGAGAGGAG
385386387388389390391392393394395396397398399400401402403404405406407408
L L E A T K R V A E E L E L E W K V V V S D D P
L L E A T K R V A E - - - - - - - - - - - - - -
TTACTGGAAGCTACCAAGCGGGTCGCGGAA------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
F Y L E G R L L E D R D I E L P D V P S Y E F E
- - - - - - - - - - - - - - - - - - - S Y E F E
---------------------------------------------------------TCGTACGAGTTCGAA
433434435436437438439440441442443444445446447448449450451452453454455456
V Y L P F K G E R S S E E A W I S V G S F N V H
V - - - - - - - - - - - - - - - S V G S F N V H
GTC---------------------------------------------TCGGTGGGCTCGTTCAACGTGCAC
457458459460461462463464465466467468469470471472473474475476477478479480
G E H F V D G F N V K E K S G R T L F T G C A G
- - - - - - - - - - - - - - - - - L F T G C A G
---------------------------------------------------CTGTTCACGGGCTGTGCGGGT
481482483484485486487488489490491492493494495496497498499500501502503504
L G V T R W V V G L L A Q H G F E P E E W P E P
- G V T R W V V G - - - - - - - - - - - - - - -
---GGTGTCACCCGATGGGTGGTTGGG---------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527
I L E R I D E K F G G L P E V P K T L T W P E
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_ser_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I R F V R A N P D A I R E D L K K R N D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K L A W I D D L L V Q D I R H R E L I G Q T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L R R R R N S I S Y D I N R A K K A G E D A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L I A E A A G L P G R I K E N E A E M E E I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K I R Y Y L M R I P N I L H E S V P V G A D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T Q N V E V K R Y G T P R T F T F E L K N H G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L A A D N D W A D F E R A T K T S G A G F Y F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G N L V L L D L A L Q R F S L D I L M E K G Y
- - - - - - L D L A L Q R F S L D I L M E K G Y
------------------TGGTAGATCCTTCTCTTCAAAAATTTCATCCTGGTACATTGCTGCCATCGGATG
193194195196197198199200201202203204205206207208209210211212213214215216
T P I I P P Y M I N R K S Y E E V T D L D D F E
T P I I P P Y M I - - - - - - - - - - - - - - -
CTCACTGGTGGCGATCAGGTATGCATC---------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K V M Y K I E D D D A Y L I A T S E H P M A A M
- - - - - - - - - - - Y L I A T S E H P M A - -
---------------------------------GTATGGAGGTATGATGGGCGTATACCCTTTTTC------
241242243244245246247248249250251252253254255256257258259260261262263264
Y Q D E I F E E K D L P L R L A G L S P C F R R
- - - - - - - - - - - - L R L A G L S P C F R R
------------------------------------AAGCACCAGATTTCCTTTCAGAAAATAAAAGCCCGC
265266267268269270271272273274275276277278279280281282283284285286287288
E I G S H G L D T K G L F R V H Q F H K V E Q F
- - - - - - - - - - - - - - - H Q F H K V E Q F
---------------------------------------------TGCAGCAAGTTGCCCGTGGTTTTTAAG
289290291292293294295296297298299300301302303304305306307308309310311312
V Y C H P D D S W T I H E E L R E N A E E I F Q
V Y - - - - - - - - - H E E L R E N A E E I F Q
TTCAAA---------------------------CTTCACCTCGACATTCTGGGTATCATCAGCACCAACCGG
313314315316317318319320321322323324325326327328329330331332333334335336
K L E I P Y R V V N I C T G D I G T V A A K K Y
- - - - - - - - - - - - - - - - - - - - - - K Y
------------------------------------------------------------------CATCTC
337338339340341342343344345346347348349350351352353354355356357358359360
D I E A W M P R E N E Y R E V V S C S N C T T Y
D I E A - - - - - - - - - E V V S C S N C - - -
AGCTTCATTTTC---------------------------TTCAGCGATGAGTGCAGATGCATC---------
361362363364365366367368369370371372373374375376377378379380381382383384
Q A V R L N I R V R D K E D F E S K Q F V H T L
- - - - - - - - - - - - - - - - - - - - V H T L
------------------------------------------------------------CTGACCAATAAG
385386387388389390391392393394395396397398399400401402403404405406407408
N S T A I A T S R A M R A I L E N N Q Q E D G S
N S T A . A T S R A M R A - - - - - - - - - - -
TTCACGGTGACG---ATCCTGAACAAGCAGGTCATCTAT---------------------------------
409410411412413414415416417418419420421422423424425
V V I P K V L R P Y M N D K E F L
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/ser_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M W S I L K A V R E N P E I L Y E S Q R R R G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V D I V D R A I E L D R K W R E E L K R V N Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L R K R R N E L A R A V K E A K G E E R A K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E E A K A V S E E V K R A E E E L K R L E A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E E V L L S I P N I I H E S V P V G K D D S E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V P I K Y W G K A K V Y F E D V D A F V E M T Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G M A E Y E V T D V K P I G H A D A V E I F G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A D L E R A A K V A G A R F Y Y L L N D L V W L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CAG
193194195196197198199200201202203204205206207208209210211212213214215216
D F A L T M Y A L D F L R K E D F T I V S P P Y
D F A L T M Y A L D F L R K E D F T I V S P P Y
AACCTCCCTCATGTGCATCGCAGCTATTGGATGCTCGCTTGTGGCTATAAGATAGAGGTCTTCATCTTCAAC
217218219220221222223224225226227228229230231232233234235236237238239240
M M R R E A Y S G V T A F S D F E E V I Y K V E
M M - - - - - - - - - - - - - - - - - - - - - -
CTTGTA------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E D L Y L I A T S E H P I A A M H M R E V L E
- - - - Y L I A T S E H P I A - - - - - - - - -
------------TGTGAAGTCCTCCTTTCTCAGAAAGTCAAGGGC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E R E L P L L Y A G V S P C F R K E A G A H G K
- - - - - L L Y A G V S P C F R K - - - - - - -
---------------CAGGTAGTAGAACCTCGCCCCCGCAACCTTTGCCGC---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D T K G I F R V H Q F N K V E Q F V F C L P E Q
- - - - - - - - H Q F N K V E Q F V F - - - - -
------------------------ACCGATAGGTTTGACGTCCGTAACTTCATACTC---------------
313314315316317318319320321322323324325326327328329330331332333334335336
S W E W H E K L I E N V E K L W Q G L G I P Y R
- - - - H E K L I E N V E K L W Q - - - - - - -
------------GGCATCAACATCCTCGAAGTAGACCTTCGCCTTCCCCCA---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I V N I C T G D L G I V A A K K Y D L E A W M P
- - - - - - - - - - - - - - - K Y D L E A - - -
---------------------------------------------AATTGAAAGCAGAACTTC---------
361362363364365366367368369370371372373374375376377378379380381382383384
A Q A K Y R E M V S C S N C T D W Q S Y R L D I
- - - - - - E M V S C S N C - - - - - - - - - -
------------------CTCCTCCTCAGCCCTTTTAACCTC------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R F A E E R G K P S K G F V H T L N S T A I A T
- - - - - - - - - - - - - V H T L N S T A . A T
---------------------------------------CGCCAGCTCGTTTCTCCGCTTTCT---CTGGTT
409410411412413414415416417418419420421422423424425426427428429430431432
T R A I T A I I E N F Q L E D G R V E I P R V L
T R A I T A - - - - - - - - - - - - - - - - - -
TACCCTCTTAAGCTCTTC------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453
R K Y L E P I E S A P K D F I M P A K S Q
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_ser_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K F K L K G I I K L S K E V P G I E D D L E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F F T E A E S D I L R R G V P E G Q E H E A A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I K S W R L E G D T L H I E M E S G R R V R A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
D G L L R L K K P L G Q L L G P K Y R V G V R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I S V T D Y T M E M K A P G V S G I P S L A E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P F V E D A A I T D G T I M V R F Q P L E E S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L R K H V F D R V V K H A R T L V E S S D D L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V Q V T R A T P G E I I A R S R S R D F F F E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D P T E E A M R L G W V K K F P G R G Q W F Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P K I T A L H R A L E E F F I E R I V K P L G F
- - - - - L H R A L E E F F I E R . V K P L G F
---------------CTCCACCGGGCCCTGGAGGAGTTCTTCATTGAAAGG---GTGAAACCCCTGGGATTT
241242243244245246247248249250251252253254255256257258259260261262263264
V E C L F P K L I P L D I M N K M R Y L E G L P
V E C L F P K L I - - - - - - - - - - - - - - -
GTTGAGTGCCTCTTCCCCAAACTCATA---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E G M Y Y C S A P S R D P E T F E E F K N E L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
I N R E V P M D L L K R G I K D P G Y V I A P A
- - - - - - - - - - - - - - - - - - - V I A P A
---------------------------------------------------------GTTATAGCCCCGGCC
313314315316317318319320321322323324325326327328329330331332333334335336
Q C E P F Y Q F L S H E V V S A E D L P V K F F
Q C E P F Y - - - - - - - - - - - - - - V K F F
CAGTGCGAACCCTTCTAC------------------------------------------GTAAAGTTCTTT
337338339340341342343344345346347348349350351352353354355356357358359360
D R S G W T Y R W E A G G S K G L D R V H E F Q
D R S . W T Y R W - - - - - - - - - - - H E F Q
GACAGGAGC---TGGACCTACAGGTGG---------------------------------CATGAATTCCAG
361362363364365366367368369370371372373374375376377378379380381382383384
R V E L V W L A E P G E T E E I R D R T V E L S
R V E L V W L - - - - - - - - - R D R T V E L S
AGGGTGGAACTCGTATGGCTG---------------------------CGTGACCGGACAGTTGAACTCTCA
385386387388389390391392393394395396397398399400401402403404405406407408
H D A A D E L E L E W Y T E V G D D P F Y L E G
H D A A D - - - - - - - - - - - - - - - - - - -
CATGATGCCGCCGAT---------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R K V E E R G I E F P D V P K Y E M R L S L P G
- - - - - - - - - - - - - - K Y E M R L - - - -
------------------------------------------AAGTATGAGATGAGGCTC------------
433434435436437438439440441442443444445446447448449450451452453454455456
R E K G V A V V S A N V H G T H F I E G F S I R
- - - - - A V V S A N V H - - - - - - - - - - -
---------------GCAGTTGTATCAGCCAATGTCCAT---------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E A R N L N I W T G C T G I G L S R W I Y G F L
- - - - - - I W T G C T G - G L S R W I Y G - -
------------------ATCTGGACCGGCTGCACCGGC---GGGCTCTCAAGGTGGATCTATGGT------
481482483484485486487488489490491492493494495496497498499500501502503504
A Q K G F E T G N W P D F I G E R V E G V E N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513
R I I T W P R Q D
- - - - - - - - -
---------------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_ser_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S Y S V L E A L R N S P D V V R K V L T A R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M D A S L V D K F L E L D E K W R R L K K E V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L R H E Y N K L S K E G A K A P P E R R R E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A D K A R E L A A R L E R A E K E L E E T E R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E E V L W S F P N L I H E S V P I C P E G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S I P V R H W G V V K T T K D V V D K L D K G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D Y L V V E K A P V G H A D M A E V V L K M A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
T L K A G E V A G S R F Y Y L F D D L V W L D F
- - - - - - - - - - - - - - - - - - - - - L D F
---------------------------------------------------------------CTCGACTTC
193194195196197198199200201202203204205206207208209210211212213214215216
A L A M Y A L D Y L A Q K G F R P V I P P Y M L
A L A M Y A L D Y L A Q K G F R P V I P P Y M L
GCCCTCGCCATGTACGCATTAGACTACCTAGCCCAGAAGGGGTTTAGGCCTGTGATCCCGCCGTATATGTTG
217218219220221222223224225226227228229230231232233234235236237238239240
K Y D L I R R V L D F D T F K D A I Y K I D G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D L Y L I A T A E H G I A A Y L Y K R E L L E E
- - Y L I A T A E H G I A - - - - - - - - - - -
------TACCTAATCGCCACGGCGGAGCACGGAATAGCG---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E L P Q L Y V G W S P C F R K E A G A G S R D I
- - - Q L Y V G W S P C F R K - - - - - - - - -
---------CAACTTTACGTGGGGTGGTCTCCATGTTTTAGAAAA---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K G I F R V H I F H K V E Q F V F S L P E D S W
- - - - - - H I F H K V E Q F V F - - - - - - -
------------------CATATATTCCACAAAGTGGAGCAGTTCGTCTTC---------------------
313314315316317318319320321322323324325326327328329330331332333334335336
K W H E E I T K N T E E L I R G L G L P Y R V V
- - H E E I T K N T E E L I R - - - - - - - - -
------CATGAGGAAATAACTAAAAACACCGAGGAGCTCATAAGA---------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N I C A H D L G A P A A K K Y D I E V W Y P S Q
- - - - - - - - - - - - - K Y D I E V - - - - -
---------------------------------------AAATACGACATAGAAGTG---------------
361362363364365366367368369370371372373374375376377378379380381382383384
G M Y R E L A S C S N V T D W Q S Y R L G I R V
- - - - E L A S C S N V - - - - - - - - - - - -
------------GAATTGGCGAGTTGTTCAAACGTA------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
T R K G M K R E Y V H T L N C T G L A T T R T I
- - - - - - - - - V H T L N C T G . A T T R T I
---------------------------GTCCACACGCTTAACTGCACAGGT---GCGACCACGAGGACAATA
409410411412413414415416417418419420421422423424425426427428429430431432
T A I L E N F Q R E D G A V E I P K V L R Q Y L
T A - - - - - - - - - - - - - - - - - - - - - -
ACTGCC------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451
E P I K A A P K D Y I L P K A A K S P
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_ser_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D V K L L R S N R E L F E K N C E Y R G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K A P V E D F F R L D E E W R S I N R E L N G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R S Q K N R E T R K I A E L I K N N G D A S A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K K A V E D I N A R I S D L E N K L K K I E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D R I L W T I P N L V H E S V P V C F G D E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N Q L V R Y V G H A K V F R D D I E E F K K N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G N S Q D Y E V L D E R P K S H V D L G L D L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V I D L E S A A R I S G S R F Y F I K N R L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L E M A L E N Y A V D F L S Q R G F S I V E P P
L E M A L E N Y A V D F L S Q R G F S I V E P P
CTGGAAATGGCGCTTGAGAACTATGCGGTGGATTTCCTTTCGCAGAGAGGGTTTTCGATAGTGGAACCCCCC
217218219220221222223224225226227228229230231232233234235236237238239240
Y M L N L E S M R G A T D L E T F K D T L Y K I
Y M L - - - - - - - - - - - - - - - - - - - - -
TATATGCTG---------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E G E D L Y L I A T S E H S I A A M L S N Q F L
- - - - - Y L I A T S E H S I A - - - - - - - -
---------------TACCTTATAGCAACTTCGGAGCATTCCATAGCA------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E E K D L P L R V A G I S A C F R R E A G A H G
- - - - - - L R V A G I S A C F R R - - - - - -
------------------CTCAGGGTGGCCGGTATATCGGCATGCTTCAGGCGT------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D T K G I F R V H Q F N K I E Q F V F C K P E
- - - - - - - - - H Q F N K I E Q F V F - - - -
---------------------------CATCAGTTCAACAAGATAGAGCAGTTCGTTTTC------------
313314315316317318319320321322323324325326327328329330331332333334335336
D S W D F L E E I L G N A E A I Y R S L G I P Y
- - - - - L E E I L G N A E A I Y R - - - - - -
---------------CTTGAGGAGATTCTCGGCAATGCTGAAGCCATATACAGG------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V V N V C S G E L G R L A A K K Y D I E A W F
- - - - - - - - - - - - - - - - K Y D I E A - -
------------------------------------------------AAGTACGATATAGAGGCC------
361362363364365366367368369370371372373374375376377378379380381382383384
P A Q G K F R E I V S A S N D T D Y Q A R S L N
- - - - - - - E I V S A S N D - - - - - - - - -
---------------------GAGATAGTGTCGGCTTCAAACGAC---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I K Y R T S E G N R F V H T L N S T A I A T T R
- - - - - - - - - - - V H T L N S T A . A T T R
---------------------------------GTCCACACGCTCAACAGCACGGCG---GCGACGACTAGG
409410411412413414415416417418419420421422423424425426427428429430431432
I L V A I M E N F Q E G D R I R I P D V L V P Y
I L V A - - - - - - - - - - - - - - - - - - - -
ATACTGGTAGCC------------------------------------------------------------
433434435436437438439440441
T G F Q Y I E K G
- - - - - - - - -
---------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_ser_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K F E L N G K I I F S K E I T D D A K K D I I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E V L N D R T I L L K G V P T G K E E E A S K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V N Y E F K G N E L I L N I I S G T Y A R A H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I I R L K K P I M E K V G K I H K M G I R D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I D N Y E I T I N A P H N I D A L E N L K V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E C E T E L N E E E N T I K I I F K N I G D S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L K R N I V D R A I K F V K T E I D N I G D S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E C D L T Y E V C G I A P N T I V S E Y K A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R T I S Y N K D P T E E S E K L G W V K R F S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K G Q W F Y T P P M T K L L R A F E E L L M E E
- - - - - - - - - - - - L L R A F E E L L M E E
------------------------------------CATCATTTCATTTACAAACTCTTTAAACATCTCTGG
241242243244245246247248249250251252253254255256257258259260261262263264
C I N K I G F D E C L F P K L I P L E V M Y K M
. I N K I G F D E C L F P K L I - - - - - - - -
---TCTTTTTGGCGGAGATACATAATACATTCCCTCAGGAAGCCCTTC------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R Y L E G L P E G M Y Y V S P P K R D P E M F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
E F V N E M M I K N E I P I H K L K D L L R N P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
G Y V L A P A Q C E P F Y Q F F D H E L V D I D
- - V L A P A Q C E P F Y - - - - - - - - - - -
------GCCTAATTTTTCGCTTTCTTCTGTTGGGTCTTT---------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
N P V K F V D K S G W T Y R W E G G G S K G L D
- - V K F V D K S . W T Y R W - - - - - - - - -
------AATTGTATTTGGAGCTATTCC---CACTTCATAAGTTAA---------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R V H E F L R I E T V Q M G A P E F V N S V R D
- - H E F L R I E T V Q M - - - - - - - - - R D
------AATTTCTGTTTTTACAAATTTAATTGCTCTATC---------------------------TCCAAT
385386387388389390391392393394395396397398399400401402403404405406407408
D T L K Y A E K L A E K L D L E Y W T E V G D D
D T L K Y A E K L A E - - - - - - - - - - - - -
ATTTTTAAATATGATTTTTATAGTATTTTCTTC---------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
P F Y L E G R K K E E R N I E F P E V P K Y E M
- - - - - - - - - - - - - - - - - - - - K Y E M
------------------------------------------------------------ATCTCTTATTCC
433434435436437438439440441442443444445446447448449450451452453454455456
R L W L P H V K D E R K G V A V T S A N V H G T
R L - - - - - - - - - - - - A V T S A N V H - -
CATTTT------------------------------------TAATCTAATAATTGCCTCATGGGC------
457458459460461462463464465466467468469470471472473474475476477478479480
H F V E G F G V K D Y K N R T V W T G C T G F G
- - - - - - - - - - - - - - - V W T G C T G - G
---------------------------------------------TTCATAATTTACTATTTTTGA---TTC
481482483484485486487488489490491492493494495496497498499500501502503504
L S R W V I G F L A Q Y G F D Y N D W P E L I K
L S R W V I G - - - - - - - - - - - - - - - - -
TTCCTCTTTTCCAGTAGGCAC---------------------------------------------------
505506507508509510511512513514515516517518519520521522
D K I G E M P N I P K V I T W P K K
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_ser_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D V E F L R K Y P E K Y K E M L K K R F M D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T S I V D E F L A Y D N L W R S L K K E L D N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R C L H N A I S K A I A T G K L E H N C N T K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L K D D K E Y L I T L A K S L K K E I E I L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K Q L K E I E S K R N D I L W R M P N Y I R E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V P I G E D E R Y N K P L K Y W G V A K V L D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K F K Q E T Q R K P I N I L E L D P R Y I K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L T Y K E L I D F L R S T N P E Y F V N P D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A I D F D L L N K E G L V L Y I K I D K A K H H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y D L T K E L N I A D Q E L G S K I A G S R F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
V E F E K G L F M E L K L I K F V L E T L K S R
- - - - - - - - M E L K L I K F V L E T L K . .
------------------------AGAGCCAGCTATCTTTGAGCCTAATTCTTGGTCGGCAATATT------
265266267268269270271272273274275276277278279280281282283284285286287288
T E G K Y N Y K I M K L P Y L V R G W V E K A A
. . . K Y N Y K I M K L P Y L V - - - - - - - -
---------ATCATAATGATGTTTAGCTTTGTCTATTTTTATATATAA------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
A Y F T A F E D T L Y K I E G E D L Y L N P T A
- - - - - - - - - - - - - - - - - - Y L N P T A
------------------------------------------------------AAGAAAATCTATTAATTC
313314315316317318319320321322323324325326327328329330331332333334335336
E H P I A G L Y K D Y Y F N D N E L P L I V Y G
E H P I A - - - - - - - - - - - - - - L I V Y G
TTTGTATGTTAGGCT------------------------------------------TTTTCTTTGAGTTTC
337338339340341342343344345346347348349350351352353354355356357358359360
F T T A F R K E A G S H G K D T K G I F R V H Q
F T T A F R K - - - - - - - - - - - - - - - H Q
TTGTTTGAATTTTTCTACATC---------------------------------------------TTCGTC
361362363364365366367368369370371372373374375376377378379380381382383384
F E K I E Q Y A F T T K E Q L L E I Y N F L V S
F E K I E Q Y A F - - - - - - - - - Y N F L V S
TTCTCCAATGGGGACATCTTCTCTAAT---------------------------GTTTCTCTTACTTTCTAT
385386387388389390391392393394395396397398399400401402403404405406407408
N A E T I V K K L G L P Y R I V F N S S G D M D
N A E T I V K - - - - - - - - - - - - - - - - -
TTCCTTCAATTGTTTTTCCAA---------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K K V T M Q W D L E V Y Y P A Q E K Y R E L H S
- - - - - Q W D L E V - - - - - - - - - E L H S
---------------TATTTTTGTATTGCAATT---------------------------CTTAGAGATTGC
433434435436437438439440441442443444445446447448449450451452453454455456
F G T V E E W Q A R R L N I K Y S K G Y V N T I
F G T V - - - - - - - - - - - - - - - - V N T I
ATTGTGCAAACA------------------------------------------------AGCCAAAAATTC
457458459460461462463464465466467468469470471472473474475476477478479480
Y A T A L P I Q R A M T A L L E N N L F E L N Y
Y A T A . P I Q R A M T A - - - - - - - - - - -
GTCAACTATACT---ATCCATGAATCTTTTCTTTAACAT---------------------------------
481482483484
N R L K
- - - -
------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_ser_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L E L K F V R N N P D I V G R A L V N R N M G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T E L I D S L L E Y D V A W R K C L T E G D S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K H K R N V V T R E I A Q L K K E N K D T L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I N E M Q D I N N R I K E I D D K I R D Y K S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I N E I M L S I P N I P S E T T P V G K D E N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N P V V R V V G E K K K F T F T P K P H W E I G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E A L D I L D F E R G A K I A G Q G F T V Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G A K L E R A L I N F M L D V H T R Q G Y L E
- - - - L E R A L I N F M L D V H T R Q G Y L E
------------CTTGAAAGAGCCCTCATAAACTTCATGCTTGATGTACACACCAGGCAGGGGTATCTCGAA
193194195196197198199200201202203204205206207208209210211212213214215216
V F P P V L I N E K A M T G T G Q L P K F K E D
V F P P V L I - - - - - - - - - - - - - - - - -
GTTTTCCCGCCTGTGCTAATC---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M Y L C C A D G Y Y L A P T A E V P V T N L F M
- - - - - - - - - Y L A P T A E V P V T - - - -
---------------------------TATCTTGCCCCGACTGCAGAAGTCCCGGTGACC------------
241242243244245246247248249250251252253254255256257258259260261262263264
D E Y M E N L P V S L T A Y T A C F R R E A G K
- - - - - - - - V S L T A Y T A C F R R - - - -
------------------------GTATCCCTTACAGCATATACCGCCTGCTTCAGGCGG------------
265266267268269270271272273274275276277278279280281282283284285286287288
H G Q D T R G I I R Q H Q F N K V E L V K F V K
- - - - - - - - - - - H Q F N K V E L V K F - -
---------------------------------CACCAGTTCAACAAGGTTGAACTTGTCAAGTTC------
289290291292293294295296297298299300301302303304305306307308309310311312
P E T S Y E E L E K L T L D A E E I L K L L K L
- - - - - - - L E K L T L D A E E I L K - - - -
---------------------CTGGAAAAACTCACCCTCGATGCCGAAGAGATTCTAAAA------------
313314315316317318319320321322323324325326327328329330331332333334335336
P Y R L V T L C T G D L G F S A A K T Y D I E V
- - - - - - - - - - - - - - - - - - T Y D I E V
------------------------------------------------------ACCTACGACATTGAGGTA
337338339340341342343344345346347348349350351352353354355356357358359360
W V P T Q E K Y R E I S S C S N F E N F Q A R R
- - - - - - - - - E I S S C S N F - - - - - - -
---------------------------GAGATCTCCTCGTGCTCGAATTTC---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A N I R F R T P E G P Q F V H T L N G S G L A V
- - - - - - - - - - - - - V H T L N G S G . A V
---------------------------------------GTCCACACGCTTAACGGCTCAGGC---GCTGTA
385386387388389390391392393394395396397398399400401402403404405406407408
G R T V V A I L E N Y Q R E D G S V E I P E V L
G R T V V A - - - - - - - - - - - - - - - - - -
GGCAGGACCGTCGTTGCT------------------------------------------------------
409410411412413414415416417418419420421
R P Y M G G V E E I R E E
- - - - - - - - - - - - -
---------------------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_ser_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I K L I R E N P E L V K N D L I K R G E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E K V K W V D E I L K L D T E W R T K L K E I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R L R H E R N K I A V E I G K R R K K G E P V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E L L A K S R E I V K R I G E L E N E V E E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K I D Y Y L W R L P N I T H P S V P V G K D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N D N V P I R F W G K A R V W K G H L E R F L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Q S Q G K M E Y E I L E W K P K L H V D L L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G G A D F A R A A K V S G S R F Y Y L L N E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V I L D L A L I R F A L D R L I E K G F T P V I
- - L D L A L I R F A L D R L I E K G F T P V I
------CGCGTGCATTCCAGCTAAGGGGTGTTCAGCGGTCGGAATTAGATATAGATCCTCATCTTCAACCTT
217218219220221222223224225226227228229230231232233234235236237238239240
P P Y M V R R F V E E G S T S F E D F E D V I Y
P P Y M V - - - - - - - - - - - - - - - - - - -
GTATATAACATCCTC---------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K V E D E D L Y L I P T A E H P L A G M H A N E
- - - - - - - Y L I P T A E H P L A - - - - - -
---------------------CTCTATGAGCCTGTCAAGGGCGAACCTAATTAG------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I L D G K D L P L L Y V G V S P C F R K E A G T
- - - - - - - - L L Y V G V S P C F R K - - - -
------------------------CCTGGAACCGCTGACCTTCGCGGCCCTTGCGAAGTC------------
289290291292293294295296297298299300301302303304305306307308309310311312
A G K D T K G I F R V H Q F H K V E Q F V Y S R
- - - - - - - - - - - H Q F H K V E Q F V Y - -
---------------------------------CCATTCAAGAATTTCATACTCCATCTTCCCTTG------
313314315316317318319320321322323324325326327328329330331332333334335336
P E E S W E W H E K I I R N A E E L F Q E L E I
- - - - - - - H E K I I R N A E E L F Q - - - -
---------------------GCCTTTCCAAACTCTGGCTTTTCCCCAGAATCTTATGGG------------
337338339340341342343344345346347348349350351352353354355356357358359360
P Y R V V N I C T G D L G Y V A A K K Y D I E A
- - - - - - - - - - - - - - - - - - K Y D I E A
------------------------------------------------------GTAATAATCGATCTTTTT
361362363364365366367368369370371372373374375376377378379380381382383384
W M P G Q G K F R E V V S A S N C T D W Q A R R
- - - - - - - - - E V V S A S N C - - - - - - -
---------------------------TTCTCCTATTCTTTTGACGATCTC---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L N I R F R D R T D E K P R Y V H T L N S T A I
- - - - - - - - - - - - - - - V H T L N S T A .
---------------------------------------------GATCTTGTTTCTCTCATGCCTAAG---
409410411412413414415416417418419420421422423424425426427428429430431432
A T S R A I V A I L E N H Q E E D G T V R I P K
A T S R A I V A - - - - - - - - - - - - - - - -
GTTTATCTCCTTAAGCTTAGTCCT------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455
V L W K Y T G F K E I V P V E K K E R C C A T
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_ser_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D L Q R I R Q E P D R V R E A I R T K G L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D P E L V D R V L A L D A E H R R T L T E L Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T R H R Q N T L A R Q I G Q L M R E G R R D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q A L I E E N T R L K E H V K T L E A R A R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G E E L E A L L L E I P N I P H P S V P V G R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
P E D N V V L H E E G C P P T F D F E P L P H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E L A A R H G L I D F E R G A K V T G S G F P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y V G K G A R L Q R A L I Q F F L D L A V Q Q G
- - - - - - - L Q R A L I Q F F L D L A V Q Q G
---------------------CTGGCTTTCCTCCAGAATTTCGTCGCGGAAGTAGTTCGTGACGGGCACCTC
193194195196197198199200201202203204205206207208209210211212213214215216
G Y T E I Q P P L F V N A D S A R G T G Q L P D
. Y T E I Q P P L F V - - - - - - - - - - - - -
---CGTGGGGATCGGATAGAGGCCGTCCCGTTC---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E D L M Y V I E R D G L Y P I P T A E V P V T
- - - - - - - - - - - - - Y P I P T A E V P V T
---------------------------------------CTGGATTTCGGTGTAGCCGCCCTGCTGCACGGC
241242243244245246247248249250251252253254255256257258259260261262263264
N Y F R D E I L E E S Q L P I K F C A Y S P C F
- - - - - - - - - - - - - - I K F C A Y S P C F
------------------------------------------TCCTTTGCCCACGTAGAACGGAAAGCCGCT
265266267268269270271272273274275276277278279280281282283284285286287288
R R E A G S Y G R D V R G L N R L H Q F D K V E
R R - - - - - - - - - - - - - - - H Q F D K V E
TCCGGT---------------------------------------------CAGCTCCCAGTGGGGCAGCGG
289290291292293294295296297298299300301302303304305306307308309310311312
L V Q F V H P D T S Y D A L E Q L R E D A E R P
L V Q F - - - - - - - - - L E Q L R E D A E R P
CTCGAAGTCGAA---------------------------CACCACGTTGTCCTCGGGGCCGCGTCCGACGGG
313314315316317318319320321322323324325326327328329330331332333334335336
L R L L G L P Y R R V L M C T A E T G F T Q A K
L R - - - - - - - - - - - - - - - - - - - - - -
CACCGA------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K Y D L E V W S P G Q Q R W L E V S S I S N F E
K Y D L E V - - - - - - - - - E V S S I S N F -
GGCTTCCAGCGTCTTGAC---------------------------GATGAGGGCCTGCGCTTCGTCGCG---
361362363364365366367368369370371372373374375376377378379380381382383384
D F Q A R R A R V R F R P A D G G R P R F V H T
- - - - - - - - - - - - - - - - - - - - - V H T
---------------------------------------------------------------CAGTTCGGT
385386387388389390391392393394395396397398399400401402403404405406407408
L N G S G L A L P R V V A A L L E H Y Q Q A D G
L N G S G . A L P R V V A A - - - - - - - - - -
CAGGGTGCGGCGATG---GGCGTCGAGTGCGAGCACGCGATC------------------------------
409410411412413414415416417418419420421422423424425426
S I V I P E V L R P Y T G F D R I G
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Archaea/Staphylothermus marinus/Smarinus_ser_aa
Archaea/Staphylothermus marinus/Smarinus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S W S I L K L L R E K P E E L K E H V K K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M D P S I V D E A Y K T D L E W R R T L T Y I Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E L R H K H N V V S R E I P K L K G V D K E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I K E A K Q L L K E L E E V E K K L K E L E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Q K L L F S L P N I V H E T V P V G P D D T Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V P I R F W G K P R V W K G F I D Q F K E Q T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K Y G F K V E Y E V I D W K P V G H A D M L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K V L R L G D T F K A G Q V A G S R F Y Y L F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D I V F L D M A L L A Y A I D Y L T S K G Y T L
- - - - L D M A L L A Y A I D Y L T S K G Y T L
------------TGCATGAAGAGCTGCTAATGGATGTTCTGCAGTTGCAATTAAGTATAAGTCTTCCCCCTC
217218219220221222223224225226227228229230231232233234235236237238239240
V L P P Y M L R H K V M M G V I D M D T F K D A
V L P P Y M L - - - - - - - - - - - - - - - - -
AATCTTATATATGGCGTCTTT---------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
I Y K I E G E D L Y L I A T A E H P L A A L H A
- - - - - - - - - Y L I A T A E H P L A - - - -
---------------------------ACTTGTTAAGTAATCGATCGCATAAGCTAGCAA------------
265266267268269270271272273274275276277278279280281282283284285286287288
W E D I P E E E L P L K Y V G I S P C F R K E A
- - - - - - - - - - L K Y V G I S P C F R K - -
------------------------------CCTGCTTCCAGCAACTTGTCCAGCTTTAAAAGTATC------
289290291292293294295296297298299300301302303304305306307308309310311312
G A G N R D L K G I F R V H Q F H K V E Q F V Y
- - - - - - - - - - - - - H Q F H K V E Q F V Y
---------------------------------------TTTCCAATCAATTACTTCATATTCTACTTTGAA
313314315316317318319320321322323324325326327328329330331332333334335336
A K P E D S W D I M E E L I S N A E H L F R G L
- - - - - - - - - M E E L I S N A E H L F R - -
---------------------------TTGATCAATGAAACCTTTCCAAACTCTTGGTTTCCCCCA------
337338339340341342343344345346347348349350351352353354355356357358359360
G I P Y R I V N I A S G D L G A P A A K K Y D L
- - - - - - - - - - - - - - - - - - - - K Y D L
------------------------------------------------------------TAGTGAAAATAG
361362363364365366367368369370371372373374375376377378379380381382383384
E A W M P A Q G R Y R E M V S C S N V T D W Q A
E A - - - - - - - - - E M V S C S N V - - - - -
AAGTTT---------------------------TTTCTTCTCTACTTCTTCGAGTTC---------------
385386387388389390391392393394395396397398399400401402403404405406407408
F R L R I R L I R R K G M V K E Y L H T L N S T
- - - - - - - - - - - - - - - - - L H T L N S T
---------------------------------------------------ACGGCTTACAACATTATGTTT
409410411412413414415416417418419420421422423424425426427428429430431432
A I A S T R T I T A I L E N F Q E P D G T V I V
A . A S T R T I T A - - - - - - - - - - - - - -
GTG---AAGCTCTTGTATATATGTAAGAGT------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P K V L R K Y L E V F K S A P I D A I H P V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459
E K N
- - -
---------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_ser_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K L T F D L D G K I I F S K E L S E E A K N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V E E V L K N A D S I F L K G V P K G K E N E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S K I K S Y E F E G N I L K L K I A S G T Y T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A H E G L I R L R K P L A E K L G R N F R I G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R G I E I D N Y V I T I E T D E D K A K K L E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I K V P E C E A K V E G N K I I L T F K D I G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
S E L K R N I I D R A I K F V K T E L E K E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L T F K V C K I P P G T I V S E Y K A K R K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T F D K D P T D V A E K L G W V K K F P G R G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
W F Y T P P I T A L F R A L E E L I V E E V V K
- - - - - - - - - L F R A L E E L I V E E V . K
---------------------------AATCTCTTTTTTAATCATCATCTCATTTACAAACTCTTT---AAG
241242243244245246247248249250251252253254255256257258259260261262263264
K I G F Q E C L F P K L I P L E I M Y K M R Y L
K I G F Q E C L F P K L I - - - - - - - - - - -
CTCTGGCTCCCTCTTTGGTGGGCATACGTAATACATTCC---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E G L P E G M Y Y V C P P K R E P E L F K E F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N E M M I K K E I P I E K L K N L L R D P G Y V
- - - - - - - - - - - - - - - - - - - - - - - V
---------------------------------------------------------------------GAA
313314315316317318319320321322323324325326327328329330331332333334335336
L A P A Q C E P F Y Q F F E G E V I D V D K P I
L A P A Q C E P F Y - - - - - - - - - - - - - I
TTTTTTAACCCATCCAAGTTTTTCAGCAAC---------------------------------------CTT
337338339340341342343344345346347348349350351352353354355356357358359360
M F F D R S G W T Y R W E G G G A R G L D R V N
M F F D R S . W T Y R W - - - - - - - - - - - N
ATATTCACTAACTATTGT---AGGTGGAATTTTACA---------------------------------CAA
361362363364365366367368369370371372373374375376377378379380381382383384
E F L R V E C V W I G S P E F V E E T R D K T L
E F L R V E C V W I - - - - - - - - - R D K T L
CTCTGTTTTTACGAACTTTATTGCTCTATC---------------------------TCCAATGTCCTTAAA
385386387388389390391392393394395396397398399400401402403404405406407408
K Y A E K L A E K L D L E Y W V E V G D D P F Y
K Y A E K L A E - - - - - - - - - - - - - - - -
AGTTAAGATAATTTTGTTTCCTTC------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
L E G R K K E D R G I E F P D V P K Y E M R L W
- - - - - - - - - - - - - - - - - K Y E M R L -
---------------------------------------------------TCTAACTCCAATTCTAAA---
433434435436437438439440441442443444445446447448449450451452453454455456
L P H I K D E R K G V A V T S A N V H G T H F V
- - - - - - - - - - - A V T S A N V H - - - - -
---------------------------------TCTAATTAATCCTTCATGAGCTCT---------------
457458459460461462463464465466467468469470471472473474475476477478479480
E G F R I K D Y K G R R V W T G C T G Y G I T R
- - - - - - - - - - - - V W T G C T G - G I T R
------------------------------------ATAGCTTTTTATTTTTGATGC---ATTTTCTTTACC
481482483484485486487488489490491492493494495496497498499500501502503504
W V V G Y L A Q Y G F N F D D W H P I I K K K I
W V V G - - - - - - - - - - - - - - - - - - - -
CTTTGGAACACC------------------------------------------------------------
505506507508509510511512513514515516517518519520521
K K L P E V P Q L I T W P K K D E
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_ser_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T W S L L R Y L R E S P D V L R E S L R K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
M D P S M V D R L R G L D E Q W R R L K R T V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E I R H K H N V I T H S I A R T K D P E E R R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L I E E A K R L L K E R E R L E A E L K R V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E R E R L L L S L P N I V H E S V P V G E S D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y N M P I R F W G R P K V Y R G F L D R F R E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T E K W G F K V D Y E V I D W K P V G H A D M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E R V L K L G N T A K A A E V A G S R F Y Y L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D D L V W L D F A L L M Y A I D K L T S K G Y R
- - - - - L D F A L L M Y A I D K L T S K G Y R
---------------GAGGCCCGCCAGCGGGTGCTCGGCCGTAGCTATGAGGTAGAGATCCTCGCCCTCAAC
217218219220221222223224225226227228229230231232233234235236237238239240
L V L P P Y M I R H R I L M G V I D M E T F R D
L V L P P Y M I - - - - - - - - - - - - - - - -
CTTGTATATGGCGTCCCTAAACGT------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A I Y K V E G E D L Y L I A T A E H P L A G L Y
- - - - - - - - - - Y L I A T A E H P L A - - -
------------------------------AAGCTTGTCTATCGCGTACATGAGCAGGGCAAA---------
265266267268269270271272273274275276277278279280281282283284285286287288
S N E E I M E D E L P I K L V G V S P C F R K E
- - - - - - - - - - - I K L V G V S P C F R K -
---------------------------------GCCAGCCACCTCGGCGGCCTTTGCAGTGTTGCCTAG---
289290291292293294295296297298299300301302303304305306307308309310311312
A G A G N R D L K G I F R V H Q F H K V E Q F V
- - - - - - - - - - - - - - H Q F H K V E Q F V
------------------------------------------GTCAATAACCTCGTAGTCTACCTTGAAGCC
313314315316317318319320321322323324325326327328329330331332333334335336
Y A K P E E S W D I L E E L I R N A E E L F Q G
Y - - - - - - - - - L E E L I R N A E E L F Q -
CCA---------------------------AAGGAAGCCGCGGTAGACCTTGGGCCTCCCCCAGAACCT---
337338339340341342343344345346347348349350351352353354355356357358359360
L G I P Y R V V N A A S G E L G A P A A K K Y D
- - - - - - - - - - - - - - - - - - - - - K Y D
---------------------------------------------------------------GAGAAGCAG
361362363364365366367368369370371372373374375376377378379380381382383384
L E A W M P A Q G R Y R E M V S A S N T T D W Q
L E A - - - - - - - - - E M V S A S N T - - - -
TCTCTCCCG---------------------------CTCGAGCCTCTCCCTCTCTTTTAG------------
385386387388389390391392393394395396397398399400401402403404405406407408
S Y R L N I R L V R R K G M V R E Y V H T L N S
- - - - - - - - - - - - - - - - - - V H T L N S
------------------------------------------------------TGTAATCACGTTATGCTT
409410411412413414415416417418419420421422423424425426427428429430431432
T A I A S T R T I T A I L E N F Q E P D G T V V
T A . A S T R T I T A - - - - - - - - - - - - -
ATGCCT---CTCGTCGACGGTACGCTTGAGCCT---------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
I P K V L R K Y L E P F S K A P K E A I Y P A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459
K R E
- - -
---------
Class II
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_ser_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L S R Q F V R E H P E A V R D A L A K K G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A D V S R I L E V D E E W R E L K S R G D T L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
H E R N E V S S K I G Q L K Q E G D E E A A Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I D R S G E L K A E L E E V E D R A D E L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L E R K L L T L P M I P D D D V P V G A D E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E N V E R R R E G F D D L R D L P V E V V P H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D L G E D L D I L D F E R G A K V S G G G F Y F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K G A G A R L E H A L V Q F M L D V H R E Q G
- - - - - - - L E H A L V Q F M L D V H R E Q G
---------------------CTCGAACACGCGCTCGTCCAGTTCATGCTCGACGTCCACCGCGAGCAGGGC
193194195196197198199200201202203204205206207208209210211212213214215216
Y V D V F P P I P V N S K S M E G T G Q F P K F
Y V D V F P P I P V - - - - - - - - - - - - - -
TACGTCGACGTCTTCCCGCCCATCCCGGTG------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V E D A Y R V G D V N E A D Y E D D D L W L L P
- - - - - - - - - - - - - - - - - - - - W L L P
------------------------------------------------------------TGGCTGCTTCCG
241242243244245246247248249250251252253254255256257258259260261262263264
T S E V P V T N M Y R D E I L L S D D L P L K H
T S E V P V T - - - - - - - - - - - - - - L K H
ACCTCGGAGGTACCGGTGACG------------------------------------------CTGAAACAC
265266267268269270271272273274275276277278279280281282283284285286287288
Q A Y S P N F R R E A G E H G T E T R G I V R V
Q A Y S P N F R R - - - - - - - - - - - - - - -
CAAGCGTACTCGCCGAACTTCCGGCGC---------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H Q F N K V E M V N F V E P E E S Y E R F E G L
H Q F N K V E M V N F - - - - - - - - - F E G L
CACCAGTTCAACAAGGTGGAGATGGTGAACTTC---------------------------TTCGAGGGTCTC
313314315316317318319320321322323324325326327328329330331332333334335336
V D E A E E V L R R L E L P Y R I L E M C T G D
V D E A E E V L R - - - - - - - - - - - - - - -
GTCGACGAGGCCGAGGAGGTCCTCCGG---------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
L G F T Q A K K Y D I E V W A P G D E M D E G P
- - - - - - - K Y D I E V - - - - - - - - - - -
---------------------AAGTACGACATCGAGGTG---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A E G G R W L E V S S V S N F E D F Q A R R A G
- - - - - - - E V S S V S N F - - - - - - - - -
---------------------GAGGTCTCGTCGGTGTCGAACTTC---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I Q Y R P E R H E S A E H L H T L N G S G L A I
- - - - - - - - - - - - - L H T L N G S G . A I
---------------------------------------CTCCACACGCTGAACGGGTCGGGG---GCCATC
409410411412413414415416417418419420421422423424425426427428429430431432
P R V M V A I L E Y Y Q N D D G T V D V P E A L
P R V M V A - - - - - - - - - - - - - - - - - -
CCCCGCGTGATGGTCGCC------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q P Y M N G Q A V I E G T Q K V G E S A L G D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460
E R E A
- - - -
------------
Class II
Bacteria/Escherichia coli/amino acid sequences/Ecoli_ser_aa
Bacteria/Escherichia coli/nucleotide sequences/Ecoli_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D P N L L R N E P D A V A E K L A R R G F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D V D K L G A L E E R R K V L Q V K T E N L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A E R N S R S K S I G Q A K A R G E D I E P L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L E V N K L G E E L D A A K A E L D A L Q A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R D I A L T I P N L P A D E V P V G K D E N D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E V S R W G T P R E F D F E V R D H V T L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
M H S G L D F A A A V K L T G S R F V V M K G Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I A R M H R A L S Q F M L D L H T E Q H G Y S E
- - - M H R A L S Q F M L D L H T E . H G Y S E
---------ATGCACCGCGCACTGTCGCAGTTTATGCTGGATCTGCATACCGAA---CATGGCTACAGTGAG
193194195196197198199200201202203204205206207208209210211212213214215216
N Y V P Y L V N Q D T L Y G T G Q L P K F A G D
N Y V P Y L V - - - - - - - - - - - - - - - - -
AACTATGTTCCGTACCTGGTT---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L F H T R P L E E E A D T S N Y A L I P T A E V
- - - - - - - - - - - - - - - - A L I P T A E V
------------------------------------------------GCGCTGATCCCAACGGCAGAAGTT
241242243244245246247248249250251252253254255256257258259260261262263264
P L T N L V R G E I I D E D D L P I K M T A H T
P L T - - - - - - - - - - - - - - I K M T A H T
CCGCTGACC------------------------------------------ATTAAGATGACCGCCCACACC
265266267268269270271272273274275276277278279280281282283284285286287288
P C F R S E A G S Y G R D T R G L I R M H Q F D
P C F R S - - - - - - - - - - - - - - - H Q F D
CCATGTTTCCGTTCT---------------------------------------------CACCAGTTCGAC
289290291292293294295296297298299300301302303304305306307308309310311312
K V E M V Q I V R P E D S M A A L E E M T G H A
K V E M V Q I - - - - - - - - - L E E M T G H A
AAAGTTGAAATGGTGCAGATC---------------------------CTGGAAGAGATGACCGGTCATGCG
313314315316317318319320321322323324325326327328329330331332333334335336
E K V L Q L L G L P Y R K I I L C T G D M G F G
E K V L Q - - - - - - - - - - - - - - - - - - -
GAAAAAGTCCTGCAG---------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
A C K T Y D L E V W I P A Q N T Y R E I S S C S
- - - T Y D L E V - - - - - - - - - E I S S C S
---------ACTTACGACCTGGAAGTA---------------------------GAGATCTCTTCCTGCTCC
361362363364365366367368369370371372373374375376377378379380381382383384
N V W D F Q A R R M Q A R C R S K S D K K T R L
N V - - - - - - - - - - - - - - - - - - - - - -
AACGTT------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V H T L N G S G L A V G R T L V A V M E N Y Q Q
V H T L N G S G . A V G R T L V A - - - - - - -
GTTCATACCCTGAACGGTTCTGGT---GCTGTTGGTCGTACGCTGGTTGCA---------------------
409410411412413414415416417418419420421422423424425426427428429430
A D G R I E V P E V L R P Y M N G L E Y I G
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_ser_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I K L I R E Q P D E V K R Q L A R C G V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G A I I D Q V L A F D E Q R R R L I Y E V E T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K A E R N A V S K Q I G A M K D Q A E R Q A K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E A M R R L G D E I A E L D R Q L A A V E E Q Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R A A M L E I R N L P H P D V P D G V D E H D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V V V Y Q E G E E R Q L P F P A R P H W E L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L G I L D F E R G V K L A G S R F Y V M R G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G A R L Q R A V I Q W L L D L H L R Q G Y Q E I
- - - L Q R A V I Q W L L D L H L R Q G Y Q E I
---------CGTATAGGCGGCGTGGTAGATCGGCAACTGACTCGCCTCCAGAATCTCGTCGGCGTAGAGACC
193194195196197198199200201202203204205206207208209210211212213214215216
Y T P F V V K E S V L W A S G Q L P K F R D N L
Y T P F V V - - - - - - - - - - - - - - - - - -
GGTCAGCGGCACTTCCGC------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y R D E E S G L W L V P T A E V P L T G L Y A D
- - - - - - - - W L V P T A E V P L T - - - - -
------------------------CAACACCGACTCTTTCACCACAAACGGTGTATA---------------
241242243244245246247248249250251252253254255256257258259260261262263264
E I L E A S Q L P I Y H A A Y T P C F R K E Q L
- - - - - - - - - I Y H A A Y T P C F R K - - -
---------------------------CTGGATCACCGCACGTTGCAGCCGCGCACCGGCACC---------
265266267268269270271272273274275276277278279280281282283284285286287288
S A G R D V R G I K R G H Q F D K V E M Y M F V
- - - - - - - - - - - - H Q F D K V E M Y M F -
------------------------------------GAAGTCGAGAATGCCCAACGCTTCACCAAGCTC---
289290291292293294295296297298299300301302303304305306307308309310311312
K P E E S Y Q A L E K L R R D A E E C A R L L G
- - - - - - - - L E K L R R D A E E C A R - - -
------------------------TTGACGTTCTTCTCCCTCTTGATAGACAACCACGTTATC---------
313314315316317318319320321322323324325326327328329330331332333334335336
L P F R T K L L C T A D L G F G S T K T Y D I E
- - - - - - - - - - - - - - - - - - - T Y D I E
---------------------------------------------------------TTGCTGCTCTTCAAC
337338339340341342343344345346347348349350351352353354355356357358359360
V W A P G V G E W L E V S S C S N V E A F Q A R
V - - - - - - - - - E V S S C S N V - - - - - -
GGC---------------------------CTCATCACCCAATCGGCGCATTGC------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A N I R Y R P E P G A K P E F V H T L N G S G
- - - - - - - - - - - - - - - - V H T L N G S G
------------------------------------------------CTCTGCTTTGCGCGTTTCAACTTC
385386387388389390391392393394395396397398399400401402403404405406407408
L G L P R T I I A I M E N Y Q Q E D G S I L I P
. G L P R T I I A - - - - - - - - - - - - - - -
---AATCAGACGACGCCGTTGCTCATC---------------------------------------------
409410411412413414415416417418419420421422423424425426
E V L R P Y M G G M E R I V N E A A
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_ser_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D L K N L Q N N F D E V A K K L K N K K V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E N I L K K L A E L F A S L K K E K I A L E E F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Q A F Q N K F S K E L A T A E D K E S L K A K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S E N K S K I N E Q S A K V N A L E N E L E E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A H A I P N I P D E C V P V G E D E N E N V E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K K V L N P P S F D F T P K E H F E L G E S L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W L D F M R G V K I S Q S R F C V L K N E G A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L S R A L V N Y M I D F N R S R G F E F V N V P
L S R A L V N Y M I D F N R S R G F E F V N V P
TTAAGCCGTGCTTTGGTAAATTATATGATAGATTTTAATAGAAGTCGTGGATTTGAATTTGTTAATGTACCT
193194195196197198199200201202203204205206207208209210211212213214215216
F L V N G A T M F G T G Q L P K F K E D M Y K V
F L V - - - - - - - - - - - - - - - - - - - - -
TTTTTGGTA---------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D D E D L Y L I S T S E I P V T N L Y S G E I L
- - - - - Y L I S T S E I P V T - - - - - - - -
---------------TATTTGATCTCAACTTCTGAAATTCCAGTAACC------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A S E T L P I K M T C Y S A C F R K E A G S A G
- - - - - - I K M T C Y S A C F R K - - - - - -
------------------ATAAAAATGACTTGTTATAGTGCTTGTTTTAGAAAA------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R D T R G I I R Q H Q F E K V E L V S I T K P E
- - - - - - - - - H Q F E K V E L V S I - - - -
---------------------------CACCAGTTTGAAAAAGTAGAGCTTGTAAGTATC------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q S D S V F N E M L E C A S D L L S S L G L A H
- - - - - F N E M L E C A S D L L S - - - - - -
---------------TTTAATGAAATGCTTGAGTGTGCAAGTGATTTGCTGAGT------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R H L M L C T G D L G F S A A K T V D L E V W L
- - - - - - - - - - - - - - - - T V D L E V - -
------------------------------------------------ACTGTAGATCTTGAAGTG------
337338339340341342343344345346347348349350351352353354355356357358359360
P G Q N K Y R E I S S V S N C R D F Q A R R A K
- - - - - - - E I S S V S N C - - - - - - - - -
---------------------GAGATCAGCTCGGTTTCAAATTGT---------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I R Y K N E Q G K N E L V H T L N G S S L A V G
- - - - - - - - - - - - V H T L N G S S . A V G
------------------------------------GTCCACACTCTTAATGGCTCATCT---GCAGTAGGA
385386387388389390391392393394395396397398399400401402403404405406407408
R T L V A I M E N Y Q D K E G K I H I P D V L K
R T L V A - - - - - - - - - - - - - - - - - - -
AGAACCTTGGTAGCG---------------------------------------------------------
409410411
K Y F
- - -
---------
Class II
Bacteria/Burkholderia thailandensis/amino acid sequences/Bthailandensis_ser_aa
Bacteria/Burkholderia thailandensis/nucleotide sequences/Bthailandensis_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I Q L L R K D L D G V A K R L A D R G Y T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D V A A F S A L E A E R R A I Q T R T E E L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A R R N S L S K Q I G A M K G R G E D T S A V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E V G G I G D E M K A S A V K L D E I Q A R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
S E L M L E M P N V P H E S V P V G R D E T E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V E V R R W G A P R Q F D F D V K D H V D V G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P L G L D F E T G A K L S G A R F T V L R G P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A R L H R A L A Q F M L D T H T Q Q H G Y S E T
- - L H R A L A Q F M L D T H T Q . H G Y S E T
------CTGCATCGCGCGCTCGCGCAGTTCATGCTGGACACGCACACGCAG---CACGGCTACAGCGAGACG
193194195196197198199200201202203204205206207208209210211212213214215216
Y T P Y I V N P D V L Y G T G Q L P K F A E D M
Y T P Y I V - - - - - - - - - - - - - - - - - -
TACACGCCTTACATCGTG------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F R V E K G G A E N T V T Q Y L I S T S E I S L
- - - - - - - - - - - - - - Y L I S T S E I S L
------------------------------------------TACCTGATCTCGACCTCGGAGATCTCGCTG
241242243244245246247248249250251252253254255256257258259260261262263264
T N T V R D S I V D A S A L P I K L T A H S P C
T - - - - - - - - - - - - - - I K L T A H S P C
ACG------------------------------------------ATCAAGCTGACCGCGCATTCGCCGTGC
265266267268269270271272273274275276277278279280281282283284285286287288
F R S E A G S Y G R D T R G M I R Q H Q F D K V
F R S - - - - - - - - - - - - - - - H Q F D K V
TTCCGCTCG---------------------------------------------CACCAGTTCGACAAGGTC
289290291292293294295296297298299300301302303304305306307308309310311312
E M V Q I V A P E A S Y A A L D E M V G H A E A
E M V Q I - - - - - - - - - L D E M V G H A E A
GAGATGGTGCAGATC---------------------------CTCGACGAGATGGTCGGCCACGCGGAGGCG
313314315316317318319320321322323324325326327328329330331332333334335336
I L Q T L E L P Y R V V A L C T G D M G F S A A
I L Q - - - - - - - - - - - - - - - - - - - - -
ATCCTGCAG---------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
K T F D L E V W L P A Q N T Y R E I S S C S N T
- T F D L E V - - - - - - - - - E I S S C S N T
---ACGTTCGACCTCGAGGTG---------------------------GAGATCTCGAGCTGCTCGAATACC
361362363364365366367368369370371372373374375376377378379380381382383384
E S F Q A R R M Q A R F R N A Q G K P E L V H T
- - - - - - - - - - - - - - - - - - - - - V H T
---------------------------------------------------------------GTGCATACG
385386387388389390391392393394395396397398399400401402403404405406407408
L N G S G L A V G R T L V A V L E N Y Q N A D G
L N G S G . A V G R T L V A - - - - - - - - - -
CTGAACGGCTCGGGC---GCGGTCGGCCGCACGCTCGTCGCG------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
S V T V P V A L R P Y M G G V E R I A A P S S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433
A
-
---
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_ser_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R R N F V C A S C I P A E P V L D L R L L R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N P E A T Q A R L D R R H S S Y D I Q P L L S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D Q Q V R Q W E Q E R T Q L Q A R S N E I G R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V G Q K M R E G A D P Q S E E I A A L R E E G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q L K Q Q I A D L E Q Q E R Q V R S E L D T Y L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L T L P N L P D E T V P L G S S E D E N R E I H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R W G D D R I R E G E F A P H W E I G E R L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F D F E R S T R I A Q S R F V T L L G A G A A L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------CGG
193194195196197198199200201202203204205206207208209210211212213214215216
E R A L I A F M L D R Q T A A G Y T E V A P P Y
E R A L I A F M L D R Q T A A G Y T E V A P P Y
CACTTCTGCTGTCGGGGTCAGCCAGAGGTCGTCGCGATCGCAGCGGAAACTTTCTTCAGAAAATTTGGGCAG
217218219220221222223224225226227228229230231232233234235236237238239240
L I N S A S L T A S G Q L P K F S E E S F R C D
L I - - - - - - - - - - - - - - - - - - - - - -
CTGACC------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R D D L W L T P T A E V P L T S L Y R D E I L S
- - - - W L T P T A E V P L T - - - - - - - - -
------------CATGAAAGCGATCAAAGCTCGCTCCAAAGCCGC---------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A D Q L P L R Y C A Y T P C F R R E A G S Y G R
- - - - - L R Y C A Y T P C F R R - - - - - - -
---------------CGTCGAACGCTCGAAATCAAATAGTCCCAGTCGCTC---------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D T R G L I R L H Q F N K V E L Y Q F V H P D H
- - - - - - - - H Q F N K V E L Y Q F - - - - -
------------------------GTCGCCCCAGCGGTGGATCTCGCGGTTCTCGTC---------------
313314315316317318319320321322323324325326327328329330331332333334335336
S E A A H Q Q L L A N A E A I L Q A L E L P Y R
- - - - H Q Q L L A N A E A I L Q - - - - - - -
------------GTCGGGCAGATTCGGCAGGGTTAATAGGTAGGTGTCGAG---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T I E L C T G D L G F S A Q K T Y D I E V W L P
- - - - - - - - - - - - - - - T Y D I E V - - -
---------------------------------------------TTCCCGGAGCGCTGCAAT---------
361362363364365366367368369370371372373374375376377378379380381382383384
S A G R Y R E I S S C S N C G D F Q A R R A N I
- - - - - - E I S S C S N C - - - - - - - - - -
------------------GCGCATTTTTTGGCCAACACTCCG------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R F K E A G Q K G T R F V H T L N G S G L A V G
- - - - - - - - - - - - V H T L N G S G . A V G
------------------------------------GAGGCTCAGCAGAGGCTGGATATC---GCTAGAGTG
409410411412413414415416417418419420421422423424425426427428429430431432
R T M A A V L E N Y Q Q P D G S V R V P E A L Q
R T M A A - - - - - - - - - - - - - - - - - - -
GCGGCGATCGAGGCG---------------------------------------------------------
433434435436437438439440441442443
P Y L R Q T V I G Q P
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_ser_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L T I K Q I T E N T D A V I R G L E K K H F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
G A K E T I A Q V I E V N D K R R N T Q N Q L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K N L A E V N S L S K T I G Q L M K E G K K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E V A K A R V A E I K E S N K T L Q A D M D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A A N D M L N L L Y T I P N I P Y D S V P E G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G A E D N V V E K M G G M E T Q L P T D A L P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W E L A K K Y D L I D F D L G V K I T G A G F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V Y K G K G A Q L Q R A L I N F F L D E A R K S
- - - - - - - - L Q R A L I N F F L D E A R K S
------------------------ATCCAAAATGACGTCACGGTAGATATTAGTTACCGGAACTTCAGCCGT
193194195196197198199200201202203204205206207208209210211212213214215216
G Y T E I M P P T V V N A A S G Y G T G Q L P D
G Y T E I M P P T V V - - - - - - - - - - - - -
CGGAATCAGATAGAGATCGTCTACTTCGCAATG---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E G Q M Y H C E V D D L Y L I P T A E V P V T
- - - - - - - - - - - - - Y L I P T A E V P V T
---------------------------------------TTCGGTATATCCGGATTTACGTGCTTCATCCAG
241242243244245246247248249250251252253254255256257258259260261262263264
N I Y R D V I L D E K Q L P I K N C A Y T Q C F
- - - - - - - - - - - - - - I K N C A Y T Q C F
------------------------------------------TTTGTAAACAGGAAAACCTGCACCGGTTAT
265266267268269270271272273274275276277278279280281282283284285286287288
R R E A G S Y G K D V R G L N R L H E F S K V E
R R - - - - - - - - - - - - - - - H E F S K V E
TTTTAC---------------------------------------------ATGGGGGAGTGCATCTGTGGG
289290291292293294295296297298299300301302303304305306307308309310311312
L V R I D K P E H S R Q S H Q E M L D H V E G L
L V R I - - - - - - - - - H Q E M L D H V E G L
AAGTTGAGTTTC---------------------------GTCCTCGGCACCAACACCTTCGGGCACACTGTC
313314315316317318319320321322323324325326327328329330331332333334335336
L Q K L E L P Y R I L R L C G G D M S F T A A L
L Q - - - - - - - - - - - - - - - - - - - - - -
ATAGGG------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
C F D F E V Y S E A Q K R W L E V S S V S N F D
C F D F E V - - - - - - - - - E V S S V S N F -
TGTTTTATTGCTCTCCTT---------------------------TTCAGCTTCTTCCTTTTTGCCTTC---
361362363364365366367368369370371372373374375376377378379380381382383384
T Y Q A N R L K C R Y R S G E K K T E L C H T L
- - - - - - - - - - - - - - - - - - - - C H T L
------------------------------------------------------------ATTTTGTGTATT
385386387388389390391392393394395396397398399400401402403404405406407408
N G S A L A L P R I V A A L L E N H Q T P E G I
N G S A . A L P R I V A A - - - - - - - - - - -
ACGTCTTTTGTC---CACTTCGATTACTTGGGCAATTGT---------------------------------
409410411412413414415416417418419420421422423424
R I P K A L V P Y C G F D M I D
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Geobacillus stearothermophilus/amino acid sequences/Gstearothermophilus_ser_aa
Bacteria/Geobacillus stearothermophilus/nucleotide sequences/Gstearothermophilus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D V K I L R A Q F E E V K E K L M Q R G G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L A N I D R F E Q L D K E R R R L I A E V E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K S K R N D V S Q Q I A A L K R E K K D A E P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I V Q M R E V G D R I K Q M D E H I R Q L E E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L N A L L L S I P N I P H E S V P V G Q S E E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V E V R R W G E P R S F S F E P K P H W D I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D Q L G L L D F E R A A K V A G S R F V F Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G A R L E R A L I N F M L D I H L D E F G Y E
- - - - L E R A L I N F M L D I H L D E . G Y E
------------CTTGAGCGGGCGTTAATCAACTTTATGCTTGACATCCATCTCGATGAA---GGCTATGAA
193194195196197198199200201202203204205206207208209210211212213214215216
E V L P P Y L V N R A S M I G T G Q L P K F A E
E V L P P Y L V - - - - - - - - - - - - - - - -
GAAGTGCTGCCCCCCTATTTGGTG------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D A F H L D S E D Y F L I P T A E V P V T N L H
- - - - - - - - - - F L I P T A E V P V T - - -
------------------------------TTTCTCATTCCGACAGCGGAAGTGCCGGTGACG---------
241242243244245246247248249250251252253254255256257258259260261262263264
R D E I L S A D D L P L Y Y A A Y S A C F R A E
- - - - - - - - - - - L Y Y A A Y S A C F R A -
---------------------------------CTTTACTATGCAGCGTACAGCGCCTGTTTCCGCGCT---
265266267268269270271272273274275276277278279280281282283284285286287288
A G S A G R D T R G L I R Q H Q F N K V E L V K
- - - - - - - - - - - - - - H Q F N K V E L V K
------------------------------------------CATCAGTTCAACAAAGTGGAGCTTGTTAAG
289290291292293294295296297298299300301302303304305306307308309310311312
F V K P E D S Y E E L E K L T R Q A E T I L Q R
F - - - - - - - - - L E K L T R Q A E T I L Q -
TTT---------------------------CTGGAAAAATTGACACGGCAGGCGGAAACGATTTTGCAG---
313314315316317318319320321322323324325326327328329330331332333334335336
L G L P Y R V V A L C T G D L G F S A A K T Y D
- - - - - - - - - - - - - - - - - - - - - T Y D
---------------------------------------------------------------ACATACGAT
337338339340341342343344345346347348349350351352353354355356357358359360
I E V W L P S Y G T Y R E I S S C S N F E A F Q
I E V - - - - - - - - - E I S S C S N F - - - -
ATTGAAGTA---------------------------GAAATTTCATCGTGCAGCAACTTT------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R A N I R F R R D P K A K P E Y V H T L N G
- - - - - - - - - - - - - - - - - - V H T L N G
------------------------------------------------------GTGCACACGTTAAACGGC
385386387388389390391392393394395396397398399400401402403404405406407408
S G L A I G R T V A A I L E N Y Q Q E D G S V I
S G . A I G R T V A A - - - - - - - - - - - - -
TCAGGG---GCCATCGGCCGAACGGTCGCCGCT---------------------------------------
409410411412413414415416417418419420421422423424
I P E A L R P Y M G N R D V I R
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_ser_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I R L F R E Q P E L V R E G F A K V G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P G L V D Q V I G L D L K R R E A I T E V E R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K A E R N A G S K D V A R T K D K A E R D V K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A A M K L V G D Q I T E L D A Q A N A I D L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
H N L L L D L P N L P L P E V P V G K D E H D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V V V R V E G T I Q E P D F A V K P H W E L G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L G I L D F E R G V R M S G T R F F V M K G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G V R L Q R A L I S W M I D M H V D Q H G Y T E
- - - L Q R A L I S W M I D M H V D Q . G Y T E
---------GCGTAATGGCAATTGAGCTTTATCTAAAATTTCTTCGCGATGCAAGTT---AACTGGCACTTC
193194195196197198199200201202203204205206207208209210211212213214215216
L A V P Y L V K A D A M V G T G N L P K F A D T
L A V P Y L V - - - - - - - - - - - - - - - - -
AGCGGTCGGAATCAGCCATAA---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I F H I E D T D L W L I P T A E V P V T N L H R
- - - - - - - - - W L I P T A E V P V T - - - -
---------------------------CAAGTAGGGCACGGCCAATTCGGTGTAACCATG------------
241242243244245246247248249250251252253254255256257258259260261262263264
E E I L D K A Q L P L R Y V A H T P C F R N E Q
- - - - - - - - - - L R Y V A H T P C F R N - -
------------------------------TTGCAAGCGCACGCCCAAGCCTTTCATCACGAAAAA------
265266267268269270271272273274275276277278279280281282283284285286287288
M S A G R D V R G I K R L Y Q F D K V E M V K M
- - - - - - - - - - - - - Y Q F D K V E M V K M
---------------------------------------GAGGGCTTCGCCTAGCTCCCAGTGTGGCTTAAC
289290291292293294295296297298299300301302303304305306307308309310311312
V E P A T S Y D E L F S L I S N A E D V C K G L
- - - - - - - - - L F S L I S N A E D V C K - -
---------------------------TTCGACCCGCACCACAACATTATCGTGTTCATCCTTGCC------
313314315316317318319320321322323324325326327328329330331332333334335336
K I P Y R L L Q L C T A D L G I A T V K Y D L E
- - - - - - - - - - - - - - - - - - - K Y D L E
---------------------------------------------------------GATTGCATTTGCCTG
337338339340341342343344345346347348349350351352353354355356357358359360
M W A P G M N E W L E V S S C G L F G D Y Q A R
M - - - - - - - - - E V S S C G L F - - - - - -
TGC---------------------------CAGCTTCATGGCGGCAATTTTCAC------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A N I R Y R P E A G A K P E F V H T L N G S G
- - - - - - - - - - - - - - - - V H T L N G S G
------------------------------------------------CCGCTCAACTTCGGTAATCGCCTC
385386387388389390391392393394395396397398399400401402403404405406407408
L A L P R V I I A I L E N Y Q N A D G S V T V P
. A L P R V I I A - - - - - - - - - - - - - - -
---CCGTTTAAGATCCAAGCCAATCAC---------------------------------------------
409410411412413414415416417418419420421422
E V L R P Y M G G I E R I G
- - - - - - - - - - - - - -
------------------------------------------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_ser_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D I K L I R Q N P D F V K E A L R K R G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A I I D E I L K I D A D W R A T I T K T N E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R S R R N E I S K N V A R L K K E G K N A E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A L I E E G K R L G E E I K A L E E K E K E L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K K L N D L L L M I P N I P H E S V P V G E D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S Q N V E V R R W G E P R E F D F T P L A H W D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L G P A W G L M D F S R A S K L S G S R F T V M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y G K L A R L E R A L I N F M L D V H T K E H G
- - - - - - L E R A L I N F M L D V H T K E . G
------------------CTCGAGAGGGCTCTGATAAACTTCATGCTTGACGTTCATACAAAGGAA---GGT
193194195196197198199200201202203204205206207208209210211212213214215216
Y T E V W V P H L V K R E T I T I T G Q L P K F
Y T E V W V P H L V - - - - - - - - - - - - - -
TACACGGAAGTGTGGGTTCCACACCTGGTG------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E E E L Y L A E R D D L F L I P T A E V P L A A
- - - - - - - - - - - - F L I P T A E V P L A -
------------------------------------TTCCTCATTCCGACGGCTGAGGTTCCCCTCGCA---
241242243244245246247248249250251252253254255256257258259260261262263264
L H S G E I L E E K E L P K K Y V S Y T P C Y R
- - - - - - - - - - - - - K K Y V S Y T P C Y R
---------------------------------------AAGAAATACGTCTCTTACACTCCCTGTTACCGC
265266267268269270271272273274275276277278279280281282283284285286287288
R E A G S Y G K D V R G M I R Q H Q F D K V E L
R - - - - - - - - - - - - - - - H Q F D K V E L
AGA---------------------------------------------CATCAATTCGACAAGGTCGAGCTC
289290291292293294295296297298299300301302303304305306307308309310311312
V W V T T P E R S F E D L E E L V K D A E T I L
V W V - - - - - - - - - L E E L V K D A E T I L
GTCTGGGTG---------------------------CTTGAAGAGCTTGTGAAAGACGCCGAAACCATTCTT
313314315316317318319320321322323324325326327328329330331332333334335336
R K L E L P Y R V V S L C T G D L G F T S A K T
R - - - - - - - - - - - - - - - - - - - - - - T
AGA------------------------------------------------------------------ACC
337338339340341342343344345346347348349350351352353354355356357358359360
Y D I E V W L P S Y N A Y K E I S S C S N V T D
Y D I E V - - - - - - - - - E I S S C S N V - -
TACGATATAGAAGTG---------------------------GAGATATCTTCCTGCAGTAACGTG------
361362363364365366367368369370371372373374375376377378379380381382383384
F Q A R R G N M R Y R R R S D G K L E Y V H T L
- - - - - - - - - - - - - - - - - - - - V H T L
------------------------------------------------------------GTTCACACGTTG
385386387388389390391392393394395396397398399400401402403404405406407408
N G S G I A V G R A L V A I L E N Y Q Q P D G S
N G S G . A V G R A L V A - - - - - - - - - - -
AACGGATCGGGT---GCCGTTGGAAGGGCACTCGTTGCG---------------------------------
409410411412413414415416417418419420421422423424425
V R V P E V L V P Y T G F E V I P
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Aquifex aeolicus/amino acid sequences/Aaeolicus_ser_aa
Bacteria/Aquifex aeolicus/nucleotide sequences/Aaeolicus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D I N L I R E K P D Y V K E R L A T R D K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L V S L V D K V L E L D K R R R E I I K R L E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L R S E R N K L S K E I G K L K R E G K D T T E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I Q N R V K E L K E E I D R L E E E L R K V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E L K N T L L W I P N L P H P S V P V G E D E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D N V E V R R W G E P R K F D F E P K P H W E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G E R L G I L D F K R G A K L S G S R F T V I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
G W G A R L E R A L I N F M L D L H T K K G Y K
- - - - - L E R A L I N F M L D L H T K K G Y K
---------------ATATATGGGAAGGTTCTCTTCCTTGAGTATCTCTTCTCTGTAGAGGTTTGTCAGGGG
193194195196197198199200201202203204205206207208209210211212213214215216
E I C P P H L V K P E I L I G T G Q L P K F E E
E I C P P H L V - - - - - - - - - - - - - - - -
AACTTCCGCGGTGGGTATCAGGTA------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D L Y K C E R D N L Y L I P T A E V P L T N L Y
- - - - - - - - - - Y L I P T A E V P L T - - -
------------------------------TACCAAATGGGGAGGACATATTTCCTTGTAGCC---------
241242243244245246247248249250251252253254255256257258259260261262263264
R E E I L K E E N L P I Y L T A Y T P C Y R R E
- - - - - - - - - - - I Y L T A Y T P C Y R R -
---------------------------------TTCTAATCTCGCACCCCAGCCGGCTATTACGGTAAA---
265266267268269270271272273274275276277278279280281282283284285286287288
A G A Y G K D I R G I I R Q H Q F D K V E L V K
- - - - - - - - - - - - - - H Q F D K V E L V K
------------------------------------------CAATCTTTCCCCTATTTCCCAGTGAGGTTT
289290291292293294295296297298299300301302303304305306307308309310311312
I V H P D T S Y D E L E K L V K D A E E V L Q L
I - - - - - - - - - L E K L V K D A E E V L Q -
TGG---------------------------CCATCTCCTTACTTCCACGTTGTCCTTTTCGTCCTCTCC---
313314315316317318319320321322323324325326327328329330331332333334335336
L G L P Y R V V E L C T G D L G F S A A K T Y D
- - - - - - - - - - - - - - - - - - - - - T Y D
---------------------------------------------------------------TTTCCTTAA
337338339340341342343344345346347348349350351352353354355356357358359360
I E V W F P S Q N K Y R E I S S C S N C E D F Q
I E V - - - - - - - - - E I S S C S N C - - - -
CTCTTCCTC---------------------------CTTTACTCTGTTTTGTATTTCCGT------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R M N T R F K D S K T G K N R F V H T L N G
- - - - - - - - - - - - - - - - - - V H T L N G
------------------------------------------------------GGCTTCAAGTCTTTTTAT
385386387388389390391392393394395396397398399400401402403404405406407408
S G L A V G R T L A A I L E N Y Q Q E D G S V V
S G . A V G R T L A A - - - - - - - - - - - - -
TATTTC---TCTCCTTTTGTCAAGTTCAAGAAC---------------------------------------
409410411412413414415416417418419420421422423424425
V P E V L R D Y V G T D V I R P E
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Chroococcidiopsis thermalis/amino acid sequences/Cthermalis_ser_aa
Bacteria/Chroococcidiopsis thermalis/nucleotide sequences/Cthermalis_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I K Q I R E N P Q T V Q E R L Q R R G D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
D L Q P L L E L D R Q Q R E L E Q A R S Q L Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R S N E I G K L V G Q K I K S G S S P D S P E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Q D L R E E G N T I K T R L S E L E P Q E R E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K E Q I E T F L L T I P N L P S D S T P I G K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E T E N I E V R R W G D E Y L P Q N A N I L P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W E I G E K L G L L N F E R S T K I A Q S R F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S L I G I G A Q L E R A L I Q F M L D R Q T A A
- - - - - - - - L E R A L I Q F M L D R Q T A A
------------------------CAAATCTTCTGCTGTTAAAATTTCCCCTCGATAGAAATTAGTAATTGG
193194195196197198199200201202203204205206207208209210211212213214215216
G Y V E I I P P F L I N S Q S L T A S G Q L P K
G Y V E I I P P F L I - - - - - - - - - - - - -
AACTTCAGCTGTGGGACTGAGCCACAGATCGTC---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F A E E S F K C A N D D L W L S P T A E V P I T
- - - - - - - - - - - - - W L S P T A E V P I T
---------------------------------------GGGTGGGATAATTTCTACATAACCTGCGGCGGT
241242243244245246247248249250251252253254255256257258259260261262263264
N F Y R G E I L T A E D L P I N H C A Y T P C F
- - - - - - - - - - - - - - I N H C A Y T P C F
------------------------------------------CGCCCCAATACCAATTAAACTGACAAAACG
265266267268269270271272273274275276277278279280281282283284285286287288
R R E A G S Y G R D T R G L I R L H Q F N K V E
R R - - - - - - - - - - - - - - - H Q F N K V E
GCTTTG---------------------------------------------ACCAATTTCCCAATGGGGCAG
289290291292293294295296297298299300301302303304305306307308309310311312
L Y K F V H P D T S E Q E H Q K L L H D A E A I
L Y K F - - - - - - - - - H Q K L L H D A E A I
AATGTTCGCGTT---------------------------CCGCACTTCAATGTTTTCTGTTTCGTTTTTGCC
313314315316317318319320321322323324325326327328329330331332333334335336
L Q A L Q L P Y R V L E L C T G D L G F S S T K
L Q - - - - - - - - - - - - - - - - - - - - - -
AATCGG------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T Y D L E V W L P S S E K Y R E I S S C S N C M
T Y D L E V - - - - - - - - - E I S S C S N C -
TTCTTGCGGTTCGAGTTC---------------------------TTCTTCTCGCAAATCTTGCACTTC---
361362363364365366367368369370371372373374375376377378379380381382383384
D F Q A R R G S I R F K E A G K K G T Q Y V H T
- - - - - - - - - - - - - - - - - - - - - V H T
---------------------------------------------------------------GGCTTGGAG
385386387388389390391392393394395396397398399400401402403404405406407408
L N G S G L A V G R T M A A I L E N Y Q Q P D G
L N G S G . A V G R T M A A - - - - - - - - - -
TTGCGATCGCGCTTG---TAATTCCCGCTGTTGACGGTCTAA------------------------------
409410411412413414415416417418419420421422423424425426427428
T I K V P E V L Q P Y L R R E V I G E R
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Bacteria/Mycobacterium smegmatis/amino acid sequences/Msmegmatis_ser_aa
Bacteria/Mycobacterium smegmatis/nucleotide sequences/Msmegmatis_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D L R L L R E N P D I V R A S Q R A R G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P A L V D A L L A A D T A R R S A V S A A D N L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R A E Q K A A S K L V G K A S P D E R P A L L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R A K D L A E Q V K A A E A A Q A E A E Q A F T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A A H M A I S N V I F E G V P A G G E D D F V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L D T V G E P R A I E N P K D H L E L G E S L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L I D M E R G A K V S G S R F Y F L T G A G A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L Q L G L L Q L A T Q V A V Q N G F T L M I P P
L Q L G L L Q L A T Q V A V Q N G F T L M I P P
GGCGTAACGGCGCGGTCCCGCGGACAGGTCGAGGATCTCGTCGGCGTGGTAACCGGCCAGCGGCACCTCCGA
193194195196197198199200201202203204205206207208209210211212213214215216
V L V R P E V M R G T G F L G A H A D E V Y R L
V L V - - - - - - - - - - - - - - - - - - - - -
GGTCCCGAC---------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E A D D M Y L V G T S E V P L A G Y H A D E I L
- - - - - Y L V G T S E V P L A - - - - - - - -
---------------GGGACGCACCAGCACGGGCGGGATCATGAGCGT------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D L S A G P R R Y A G W S S C F R R E A G S Y G
- - - - - - R R Y A G W S S C F R R - - - - - -
------------------CCCGAGCTGAAGCAGCGCACCGGCACCGGTCAAGAA------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K D T R G I I R V H Q F D K V E G F I Y C K P E
- - - - - - - - - H Q F D K V E G F I Y - - - -
---------------------------CAGGCCGAGCGACTCACCGAGCTCCAGGTGGTC------------
289290291292293294295296297298299300301302303304305306307308309310311312
D A E A E H Q R L L G W Q R E M L A A I E V P Y
- - - - - H Q R L L G W Q R E M L A - - - - - -
---------------ACCCACGGTGTCGAGCACCACGAAGTCGTCCTCGCCGCC------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R V I D V A A G D L G S S A A R K Y D C E A W V
- - - - - - - - - - - - - - - - K Y D C E A - -
------------------------------------------------CTCGGCCTGCGCGGCCTC------
337338339340341342343344345346347348349350351352353354355356357358359360
P T Q Q T Y R E L T S T S N C T T F Q A R R L S
- - - - - - - E L T S T S N C - - - - - - - - -
---------------------CTTGGCCCGCTGCAGCAGGGCCGG---------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
T R Y R D D N G K P Q I A A T L N G T L A T T R
- - - - - - - - - - - - A A T L N G T L A T T R
------------------------------------GTCGGCGGCCGACACCGCCGAGCGGCGTGCCGTATC
385386387388389390391392393394395396397398399400401402403404405406407408
W L V A I L E N H Q Q P D G S V R V P A A L V P
W L V A - - - - - - - - - - - - - - - - - - - -
GGCGGCCAGCAG------------------------------------------------------------
409410411412413414415416417
Y V R T E V L E P
- - - - - - - - -
---------------------------
Class II
Bacteria/Mycoplasma mobile/amino acid sequences/Mmobile_ser_aa
Bacteria/Mycoplasma mobile/nucleotide sequences/Mmobile_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I K L I L K N K D F V I S K L K Q R S N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N V S E I E K L Y T L G T E R A N I L I S L S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L Q S K R N E I S S K I G E A K R N K T D A L F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
F M D E V E N I K K E L S I L E E K S T K I E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I Q E L I S F I P N I P L D D V P F G K D D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D N V I L K E F P K I G R G L V K A K K P H Y E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I G V E K D L I D F S R G A K L S G S R F I V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K N A G A K L I R A L E S F M L D T H E K N G Y
- - - - - - L I R A L E S F M L D T H E K N G Y
------------------CAAATCGATTATTTCATTATTAAATAAATTAGTAACTGGCACTTCTGCTGTTGG
193194195196197198199200201202203204205206207208209210211212213214215216
S E I M P P F L V N S K M M Y G T G Q L P K F K
S E I M P P F L V - - - - - - - - - - - - - - -
AATTAAATATAAATCATGACCCTCTAT---------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E D L F K I E G H D L Y L I P T A E V P V T N L
- - - - - - - - - - - Y L I P T A E V P V T - -
---------------------------------TATTTCACTATAACCATTTTTTTCATGAGTATC------
241242243244245246247248249250251252253254255256257258259260261262263264
F N N E I I D L E K N S K F S S F T N C F R S E
- - - - - - - - - - - S K F S S F T N C F R S -
---------------------------------AGCATTTTTGTAGACAATAAATCTTGAACCACTCAA---
265266267268269270271272273274275276277278279280281282283284285286287288
A G S A G R D T K G I I R L H Q F N K V E L V E
- - - - - - - - - - - - - - H Q F N K V E L V E
------------------------------------------TTCATAATGTGGTTTTTTAGCTTTAACAAG
289290291292293294295296297298299300301302303304305306307308309310311312
F A S E Q K S L R A F N S V L K N A K Y L L E L
F - - - - - - - - - F N S V L K N A K Y L L E -
TCC---------------------------AATGACATTATCAGTATCATCTTTTCCAAAAGGAACATC---
313314315316317318319320321322323324325326327328329330331332333334335336
L E I P Y R E V L L C T G D L G F S S R K T I D
- - - - - - - - - - - - - - - - - - - - - T I D
---------------------------------------------------------------TTCTTCCAA
337338339340341342343344345346347348349350351352353354355356357358359360
L E L W L P S E Q R Y R E V S S V S Y F G D F Q
L E L - - - - - - - - - E V S S V S Y F - - - -
AATACTTAG---------------------------CATAAAAAATAAAGCATCTGTTTT------------
361362363364365366367368369370371372373374375376377378379380381382383384
S R R S M I R Y R D E N K N T Q Y V H T I N G S
- - - - - - - - - - - - - - - - - V H T I N G S
---------------------------------------------------AGAAATCAATATATTTGCTCT
385386387388389390391392393394395396397398399400401402403404405406407408
G L A I D R V L A A I L E Q Y Q N D D G S I S V
G . A I D R V L A A - - - - - - - - - - - - - -
TTC---TCCTAATGTATATAATTTTTCAAT------------------------------------------
409410411412413414415416417418419420421
P K V L I P Y L N V E K I
- - - - - - - - - - - - -
---------------------------------------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_ser_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I K L L R A N L E E I K Q K L A H R G E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S D F D Q F E E L D T K R R E L I V K V E E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K G K R N E V S Q Q V A A L K R E K K D A D H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I K E M R E V G E D I K K L D E E L R T V E S S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L D K I M L S I P N I P H E S V P V G E T E D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V E V R K W G E L P G F S F E P K P H W D I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D Q L D I L D F E R A G K V T G S R F V F Y K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L G A R L E R A L Y N F M L D L H V D E Y G Y T
- - - - L E R A L Y N F M L D L H V D E . G Y T
------------CTTGAACGCGCATTGTATAACTTTATGCTTGATCTCCACGTAGACGAG---GGCTATACG
193194195196197198199200201202203204205206207208209210211212213214215216
E V I P P Y M V N R A S M T G T G Q L P K F E E
E V I P P Y M V - - - - - - - - - - - - - - - -
GAAGTCATCCCGCCGTACATGGTG------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D A F K I R E E D Y F L I P T A E V P I T N L H
- - - - - - - - - - F L I P T A E V P I T - - -
------------------------------TTCTTAATTCCGACGGCGGAAGTGCCGATTACG---------
241242243244245246247248249250251252253254255256257258259260261262263264
R D E I L S A A E L P I N Y A A F S A C F R S E
- - - - - - - - - - - I N Y A A F S A C F R S -
---------------------------------ATCAATTATGCGGCGTTCAGTGCGTGCTTCCGTTCA---
265266267268269270271272273274275276277278279280281282283284285286287288
A G S A G R D T R G L I R Q H Q F N K V E L V K
- - - - - - - - - - - - - - H Q F N K V E L V K
------------------------------------------CACCAATTTAACAAGGTTGAACTGGTGAAA
289290291292293294295296297298299300301302303304305306307308309310311312
F V K P E D S Y E E L E K L T N Q A E K V L Q L
F - - - - - - - - - L E K L T N Q A E K V L Q -
TTT---------------------------CTTGAAAAACTGACAAATCAAGCGGAGAAGGTTCTTCAG---
313314315316317318319320321322323324325326327328329330331332333334335336
L E L P Y R V M S M C T G D L G F T A A K K Y D
- - - - - - - - - - - - - - - - - - - - - K Y D
---------------------------------------------------------------AAATACGAT
337338339340341342343344345346347348349350351352353354355356357358359360
I E V W I P S Q N T Y R E I S S C S N F E A F Q
I E V - - - - - - - - - E I S S C S N F - - - -
ATTGAAGTA---------------------------GAAATTTCATCATGCAGCAACTTT------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R A N I R F R R E A K G K P E H V H T L N G
- - - - - - - - - - - - - - - - - - V H T L N G
------------------------------------------------------GTCCATACGCTAAACGGA
385386387388389390391392393394395396397398399400401402403404405406407408
S G L A V G R T V A A L L E N Y Q Q E D G S V I
S G . A V G R T V A A - - - - - - - - - - - - -
TCCGGC---GCAGTCGGCAGAACGGTTGCCGCA---------------------------------------
409410411412413414415416417418419420421422423424425
I P K A L R P Y M G N R D V I Q P
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_ser_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D L K F I R D N L D L V K R S I K A R G L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D I D K L I Y L D D K R K K L I T K I G E L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A K R N E N S S K M Q E N L D K V L K I S L I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G K I L K K Q L I D L E E E L E R V S V D F D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E N K K V P N I L S P D V P I G S S E E D N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E I K R V G V V P Q F D F K P K D H L E L G R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L D L L D F D R A R E I S G S K F Y Y L K N E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V F L E I A L I N F S L N K L R D K G F D V F I
- - L E I A L I N F S L N K L R D K G F D V F I
------ATGTGAAAACCCTGCCATTCTTATTGGCAAAGTGAGATCTATTATTTTATTATAATAATAACCGCC
193194195196197198199200201202203204205206207208209210211212213214215216
T P D V A R E F I V D G I G F N P R G N E S N I
T P D V A - - - - - - - - - - - - - - - - - - -
AAGCGTAATTTCAGA---------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Y K I E D T D K Y L V G T S E I T L G G Y Y Y N
- - - - - - - - Y L V G T S E I T L G - - - - -
------------------------AACTATAAACTCTCTTGCAACATCAGGAGTAAT---------------
241242243244245246247248249250251252253254255256257258259260261262263264
K I I D L T L P I R M A G F S H C F R K E A G A
- - - - - - - - I R M A G F S H C F R K - - - -
------------------------GAAATTAATAAGAGCAATTTCTAAAAAAACTGCTTC------------
265266267268269270271272273274275276277278279280281282283284285286287288
Y G Q L S K G L Y R V H Q F S K V E M F C F C K
- - - - - - - - - - - H Q F S K V E M F C F - -
---------------------------------GTCAAAATCTAGAAGATCTAAATCTCTGCCAAG------
289290291292293294295296297298299300301302303304305306307308309310311312
A E E S G V I H D E F L S I Q E Q I F T E L E I
- - - - - - - H D E F L S I Q E Q I F T - - - -
---------------------AAACTGTGGAACAACTCCAACCCTTTTTATTTCAAAATT------------
313314315316317318319320321322323324325326327328329330331332333334335336
P Y R V L N I C S F D L G S P A Y K K Y D I E A
- - - - - - - - - - - - - - - - - - K Y D I E A
------------------------------------------------------GTCAAAATCAACAGATAC
337338339340341342343344345346347348349350351352353354355356357358359360
W M P G R D G K G G Y G E V T S T S N C T D Y Q
- - - - - - - - - - - - E V T S T S N C - - - -
------------------------------------TTTCAAAATCTTTCCGGTTTCTAT------------
361362363364365366367368369370371372373374375376377378379380381382383384
S R R L K I R Y K D Q D G Q N K F A H M V N G T
- - - - - - - - - - - - - - - - - A H M V N G T
---------------------------------------------------TGCATTAAGCTCACCAATTTT
385386387388389390391392393394395396397398399400401402403404405406407408
A I A T T R V I I S I L E N F Q D Q K G G V R I
A . A T T R V I I S - - - - - - - - - - - - - -
GGT---TAGTTTTTTTCTCTTATCATCAAG------------------------------------------
409410411412413414415416417418419420421422423424425
P K S L V K Y T G F D Y I P F K N
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_ser_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L E I N Y I Q E N K T S V I A K L H K R H L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N A A D L I E N I L T I N Q Q R K E T Q L A L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T T S S Q V N Q L T K Q I E Q L L Q E G K K Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I E S I K S Q S K V L K A S V K E L E L Q L N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y K E T L Q Q K L D E L P N L P H D N V P I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D S T S N E I V Y Q V E S I P E H T A Q L I P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
W E L I T T Y N I I D F E L G N K L T G A G F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V Y K G K G A R L Q R A L I N F F L D E A R K A
- - - - - - - - L Q R A L I N F F L D E A R K A
------------------------CTACAAAGAGCTCTAATTAATTTTTTTCTTGATGAAGCTAGAAAAGCT
193194195196197198199200201202203204205206207208209210211212213214215216
G Y E E I Q P P I L V N K A S A Y G T G Q L P D
G Y E E I Q P P I L V - - - - - - - - - - - - -
GGCTATGAAGAAATACAGCCTCCTATACTTGTT---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K E G Q M Y E L A N E P L Y L I P T A E V P V T
- - - - - - - - - - - - - Y L I P T A E V P V T
---------------------------------------TATTTAATTCCTACTGCTGAAGTGCCTGTTACA
241242243244245246247248249250251252253254255256257258259260261262263264
N L Y R D Q I L S K D V L P I R H V A Y T P C F
- - - - - - - - - - - - - - I R H V A Y T P C F
------------------------------------------ATTAGGCATGTAGCTTATACACCTTGTTTT
265266267268269270271272273274275276277278279280281282283284285286287288
R R E A G S W G S H V R G L N R L H Q F D K V E
R R - - - - - - - - - - - - - - - H Q F D K V E
AGAAGA---------------------------------------------CATCAATTTGATAAGGTGGAA
289290291292293294295296297298299300301302303304305306307308309310311312
I V E I S L P E L S Y Q A L E T M R R Y V E S L
I V E I - - - - - - - - - L E T M R R Y V E S L
ATTGTAGAAATA---------------------------TTAGAAACTATGCGTAGATATGTTGAAAGCCTA
313314315316317318319320321322323324325326327328329330331332333334335336
V Q K L E L P Y R V L K L C S G D L G F A S A F
V Q - - - - - - - - - - - - - - - - - - - - - -
GTACAG------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
T Y D I E V F S V G Q N R W L E V S S I S N Y D
T Y D I E V - - - - - - - - - E V S S I S N Y -
ACTTATGATATAGAAGTT---------------------------GAAGTAAGTTCTATTAGCAATTAT---
361362363364365366367368369370371372373374375376377378379380381382383384
T Y Q A N R M Q L R Y K D N G H N R L L H T L N
- - - - - - - - - - - - - - - - - - - L H T L N
---------------------------------------------------------TTACATACTTTAAAC
385386387388389390391392393394395396397398399400401402403404405406407408
G S A I A L P R I M A A L L E L N F T E G K I K
G S A . A L P R I M A A - - - - - - - - - - - -
GGAAGTGCC---GCCTTACCAAGAATTATGGCAGCT------------------------------------
409410411412413414415416417418419420421422423
I P H A L T K Y T D F E Y I S
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_ser_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D L K F I R E N P D A V R E A I R V K N V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L D L D D L L Q R D R D L V A L K Q R V E A M Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T E R N A N A K L V P K A S P E D R P G L I Q K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G K D L S E D L K A L E P Q L R E Q E D A L K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L L L R V P N I P L P G V P V G K D E D D N V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L R R E G E L P G F D F T P L D Q V E I L E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G W A D F E R V A R V S G S R S Y L L K G D A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L L E M A V L M F A L D F L S Q R G F T P L S T
- L E M A V L M F A L D F L S Q R G F T P L S T
---CTGGAAATGGCGGTGCTGATGTTCGCGCTCGATTTCCTGTCGCAGCGCGGCTTTACTCCACTTTCGACC
193194195196197198199200201202203204205206207208209210211212213214215216
T A L V R R E T L V N S G H F P G D E E S V Y K
T A L V - - - - - - - - - - - - - - - - - - - -
ACGGCGCTCGTC------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
L E G D E L L L A G T A E V P I N S L Y A G E Q
- - - - - - L L A G T A E V P I N - - - - - - -
------------------CTGCTCGCTGGAACCGCCGAGGTGCCGATCAAT---------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L S A D E L P L T F A G F S A A F R R E A G S A
- - - - - - - L T F A G F S A A F R R - - - - -
---------------------CTGACCTTCGCGGGTTTCAGCGCCGCCTTCCGCCGC---------------
265266267268269270271272273274275276277278279280281282283284285286287288
G R D V R G L I R V H E F R K V E Q Y V L C R A
- - - - - - - - - - H E F R K V E Q Y V L - - -
------------------------------CACGAGTTCCGCAAGGTCGAGCAGTACGTCCTG---------
289290291292293294295296297298299300301302303304305306307308309310311312
D Q E E G L K W F E R L L S N A E G L L Q A L E
- - - - - - - - F E R L L S N A E G L L Q - - -
------------------------TTCGAGCGCCTGCTGAGCAACGCCGAGGGGCTGTTGCAG---------
313314315316317318319320321322323324325326327328329330331332333334335336
L P Y R V I Q N C T G D M G A G K V L M Y D I E
- - - - - - - - - - - - - - - - - - - M Y D I E
---------------------------------------------------------ATGTACGACATCGAA
337338339340341342343344345346347348349350351352353354355356357358359360
T W V P S E Q K Y R E T H S C S Y L G D W Q A R
T - - - - - - - - - E T H S C S Y L - - - - - -
ACC---------------------------GAAACCCACTCCTGCTCGTACCTG------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R T G L R Y R D E H G K L L Y A H T L N N T G I
- - - - - - - - - - - - - - - A H T L N N T G .
---------------------------------------------GCCCACACCCTCAACAACACCGGC---
385386387388389390391392393394395396397398399400401402403404405406407408
A S P R I L V P L L E N H Q Q A D G T V R V P A
A S P R I L V P - - - - - - - - - - - - - - - -
GCCAGCCCGCGCATTCTGGTGCCG------------------------------------------------
409410411412413414415416417418419420421422423424425
A L R P Y L G G R E V L G Q P V R
- - - - - - - - - - - - - - - - -
---------------------------------------------------
Class II
Bacteria/Staphylococcus aureus/amino acid sequences/Saureus_ser_aa
Bacteria/Staphylococcus aureus/nucleotide sequences/Saureus_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D I R L F R N E P D T V K S K I E L R G D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P K V V D E I L E L D E Q R R K L I S A T E E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K A R R N K V S E E I A L K K R N K E N A D D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I A E M R T L G D D I K E K D S Q L N E I D S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
M T G I L C R I P N L I S D D V P Q G E S D E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N V E V K K W G T P R E F S F E P K A H W D I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E L K M A D F D R A A K V S G A R F V Y L T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E G A Q L E R A L M N Y M I T K H T T Q H G Y T
- - - - L E R A L M N Y M I T K H T T Q . G Y T
------------TTAGAGCGTGCTTTAATGAACTATATGATTACAAAACATACAACACAA---GGTTATACA
193194195196197198199200201202203204205206207208209210211212213214215216
E M M V P Q L V N A D T M Y G T G Q L P K F E E
E M M V P Q L V - - - - - - - - - - - - - - - -
GAAATGATGGTACCACAGCTTGTA------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D L F K V E K E G L Y T I P T A E V P L T N F Y
- - - - - - - - - - Y T I P T A E V P L T - - -
------------------------------TATACAATTCCAACTGCTGAAGTACCATTAACG---------
241242243244245246247248249250251252253254255256257258259260261262263264
R N E I I Q P G V L P E K F T G Q S A C F R S E
- - - - - - - - - - - E K F T G Q S A C F R S -
---------------------------------GAAAAATTCACTGGTCAATCTGCATGTTTCCGTAGT---
265266267268269270271272273274275276277278279280281282283284285286287288
A G S A G R D T R G L I R L H Q F D K V E M V R
- - - - - - - - - - - - - - H Q F D K V E M V R
------------------------------------------CATCAATTCGATAAAGTGGAAATGGTACGT
289290291292293294295296297298299300301302303304305306307308309310311312
F E Q P E D S W N A L E E M T T N A E A I L E E
F - - - - - - - - - L E E M T T N A E A I L E -
TTT---------------------------TTAGAAGAAATGACAACAAACGCAGAAGCAATTTTAGAA---
313314315316317318319320321322323324325326327328329330331332333334335336
L G L P Y R R V I L C T G D I G F S A S K T Y D
- - - - - - - - - - - - - - - - - - - - - T Y D
---------------------------------------------------------------ACATATGAT
337338339340341342343344345346347348349350351352353354355356357358359360
L E V W L P S Y N D Y K E I S S C S N C T D F Q
L E V - - - - - - - - - E I S S C S N C - - - -
TTAGAAGTT---------------------------GAAATTAGTTCATGCTCAAACTGT------------
361362363364365366367368369370371372373374375376377378379380381382383384
A R R A N I R F K R D K A A K P E L A H T L N G
- - - - - - - - - - - - - - - - - - A H T L N G
------------------------------------------------------GCACATACATTAAATGGT
385386387388389390391392393394395396397398399400401402403404405406407408
S G L A V G R T F A A I V E N Y Q N E D G T V T
S G . A V G R T F A A - - - - - - - - - - - - -
AGTGGT---GCAGTTGGACGTACATTTGCTGCT---------------------------------------
409410411412413414415416417418419420421422423424425426427428
I P E A L V P F M G G K T Q I S K P V K
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_ser_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M G L D I Q L F R D P E M A D I V R E S E R R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Y A R P E I V D D I I E I D K R W R R T Q F L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A S K K M I N T C S K A V G A K K K A K E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
G D V S E V P A D V M S A A R E G T L D T E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E S L C I L Q L K Q L S K A L A T Q V E S L A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L A A E Q E A E R D R M V I S V G N V L H E S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P V S N D E E T G N V V V R T F G D V T R R L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
M T H V D C M E R L G L M D T S K A V T A M A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G R A F V L R G G L V Q L Q F A L I S Y A L N F
- - - - - - - - - - - - L Q F A L I S Y A L N F
------------------------------------CTGCAATTCGCCCTCATCTCGTACGCGCTCAACTTC
217218219220221222223224225226227228229230231232233234235236237238239240
L I A R G Y E P F Y P P F F L N K E Y M G A V A
L I A R G Y E P F Y P P F F L - - - - - - - - -
CTCATCGCCCGCGGCTACGAGCCCTTCTACCCGCCCTTCTTCCTC---------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q L S D F D E S L Y K V S G D G D E K Y L I A T
- - - - - - - - - - - - - - - - - - - Y L I A T
---------------------------------------------------------TACCTGATTGCGACG
265266267268269270271272273274275276277278279280281282283284285286287288
S E A P I A A Y H T N K W F T E M K E P I K Y A
S E A P I A - - - - - - - - - - - - - - I K Y A
AGCGAGGCACCCATTGCC------------------------------------------ATCAAGTACGCC
289290291292293294295296297298299300301302303304305306307308309310311312
G V S S C F R K E A G A H G R D T L G I F R V H
G V S S C F R K - - - - - - - - - - - - - - - H
GGCGTCTCGTCGTGCTTCCGAAAG---------------------------------------------CAC
313314315316317318319320321322323324325326327328329330331332333334335336
Q F D K L E Q F V V C S P R E D Q S W K M L E E
Q F D K L E Q F V V - - - - - - - - - - - L E E
CAGTTCGACAAACTGGAGCAGTTTGTTGTG---------------------------------CTGGAAGAG
337338339340341342343344345346347348349350351352353354355356357358359360
M I Q T S Q D F N E S L G L P Y R V I N I C S G
M I Q T S Q D F N E - - - - - - - - - - - - - -
ATGATCCAGACCTCCCAGGACTTCAACGAG------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
A L N N A A A K K Y D L E A W F P G S G A F R E
- - - - - - - - K Y D L E A - - - - - - - - - E
------------------------AAGTACGACCTGGAGGCG---------------------------GAG
385386387388389390391392393394395396397398399400401402403404405406407408
L V S C S N C T D Y Q A R S V N C R F G P N T K
L V S C S N C - - - - - - - - - - - - - - - - -
CTTGTTTCGTGCTCGAACTGC---------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
G S T A N S T K E Y C H M L N G T L C A V T R T
- - - - - - - - - - C H M L N G T L . A V T R T
------------------------------TGCCACATGCTGAACGGTACTCTC---GCTGTCACTCGCACA
433434435436437438439440441442443444445446447448449450451452453454455456
M C C I C E N Y Q T E E G I L I P E V L R P F M
M C C - - - - - - - - - - - - - - - - - - - - -
ATGTGCTGC---------------------------------------------------------------
457458459460461462463464465466467468469470471472473474
M G T E M L K F P A E A P T A D K E
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_ser_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V L D I N L F R V S K G G N P E K V K E S Q R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
R R Y A S T E I V D K V I E L D K A W V S K D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A S Q L S K E L N Q L N K D F G A A M K A K S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
P T D E L S K K I A A N K Q E T E R V K K E V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Q L L A E R N A V L N T I G N I V C D A V V V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
N N E D N N K V V Y T N D A V V R A N P S P N G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V E K T L N H V T L M T N C R M M D C P R G V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I S G N R G Y F L T G Y G A L L N Q A L I Q Y A
- - - - - - - - - - - - - - - L N Q A L I Q Y A
---------------------------------------------TGTTTTGATAGAGTTGTACGTTAGCTC
193194195196197198199200201202203204205206207208209210211212213214215216
L K F L T D R G Y Q A M Q T P F F M E Q E A M S
L K F L T D R G Y Q A M Q T P F F M - - - - - -
TGCTATCTGGCCTTGTTTTGAAAAGTTGATAATCTCCCCCATGTGGTATGCGCA------------------
217218219220221222223224225226227228229230231232233234235236237238239240
C C C Q L E D F D E Q L Y K V S G E G N D K Y L
- - - - - - - - - - - - - - - - - - - - - - Y L
------------------------------------------------------------------CTGGCA
241242243244245246247248249250251252253254255256257258259260261262263264
I A T S E Q P L C A Y H M G E I I N F S K Q G Q
I A T S E Q P L C - - - - - - - - - - - - - - -
GCAACATGACATCGCCTCTTGCTCCAT---------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I A E L T Y N S I K T G K Q E K K T L E C I R Y
- - - - - - - - - - - - - - - - - - - - - I R Y
---------------------------------------------------------------TCTGTTGCC
289290291292293294295296297298299300301302303304305306307308309310311312
A G M S T C F R K E V G R H G H D T L G I F R I
A G M S T C F R K - - - - - - - - - - - - - - -
AGATATCTTGACCCCTCTCGGGCAGTC---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Q F E K I E Q I V V C K E E D S W D M M E Y M
H Q F E K I E Q I V V - - - - - - - - - M E Y M
TTCGACGCCATTGGGAGAAGGGTTGGCCCTAAC---------------------------ATTATTATCCTC
337338339340341342343344345346347348349350351352353354355356357358359360
I D N C R A F F D S L M I P Y R V V I I V S G A
I D N C R A F F D - - - - - - - - - - - - - - -
ATTATTGTCAACTACGACTGCGTCGCA---------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
L N N A A A M K Y D L E A Y F P G S N T Y R E L
- - - - - - - K Y D L E A - - - - - - - - - E L
---------------------GACCCTTTCTGTCTCTTG---------------------------CTCGTC
385386387388389390391392393394395396397398399400401402403404405406407408
V S C S N C T D Y Q S R S L D I K Y Q D G K D K
V S C S N C - - - - - - - - - - - - - - - - - -
GGTAGGGCTCTTTGCCTT------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K Y V H L L N S T L S A T E R T L C C L V E N Y
- - V H L L N S T L . A T E R T L C C - - - - -
------ATAGTCTTTAGAGACCCAGGCCTT---CAACTCTATGACCTTGTCAACGAT---------------
433434435436437438439440441442443444445446447448449450451452453454455456
Q T P T G I K V P V P L Q S Y V G A D F L P F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457
V
-
---
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_ser_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L D Q R L V R D N P E I I V T Q L G R R G I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L S L E G L Q L I A Q H Q K S L E S R R S T L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S R A N S I G K Q V S E T I W K G I P F E S P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V N R L R E I G N K I K R Q V S I L E E E E Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F T Y Y L K E Q L L T F P N L P S K S C P N G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
T E V D N V E Q R C W G K P R Q E V N L K N H W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E I A D K L G I I D T E R S V R I A Q S R F V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L I G Q G A K L E R A L I N F M L D F H T K K G
- - - - - - - L E R A L I N F M L D F H T K K G
---------------------AAGATCATCCGCAGCAATAATTTCGTCTCGGTGTAAGGAAGTAATTGGGAC
193194195196197198199200201202203204205206207208209210211212213214215216
Y C E I L P P I L A N T N S L T G S G Q L P K F
Y C E I L P P I L A - - - - - - - - - - - - - -
TTCAGAAGTGGGAATAAGCCATAGGTCATC------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A E E S F R C S E D D L W L I P T S E V P I T S
- - - - - - - - - - - - W L I P T S E V P I T -
------------------------------------AGGAGGAAGAATTTCACAATAGCCCTTCTTGGT---
241242243244245246247248249250251252253254255256257258259260261262263264
L H R D E I I A A D D L P L K Y V A Y S P C F R
- - - - - - - - - - - - - L K Y V A Y S P C F R
---------------------------------------TGCACCTTGACCTATCAAAGTTACAAAGCGGCT
265266267268269270271272273274275276277278279280281282283284285286287288
R E A G S Y G R D T R G L I R L H Q F N K V E L
R - - - - - - - - - - - - - - - H Q F N K V E L
TTG---------------------------------------------TGCTATCTCCCAATGATTTTTAAG
289290291292293294295296297298299300301302303304305306307308309310311312
Y W F S H P D D S D K A H I Q I T A D A E A V L
Y W F - - - - - - - - - H I Q I T A D A E A V L
ATTAACTTC---------------------------TTCTACATTATCAACCTCAGTCTTACCATTAGGGCA
313314315316317318319320321322323324325326327328329330331332333334335336
Q A L E L P Y R V L D L C T G D I G F S A T R T
Q - - - - - - - - - - - - - - - - - - - - - - T
AGA------------------------------------------------------------------TTC
337338339340341342343344345346347348349350351352353354355356357358359360
Y D L E V W L P G A N A Y R E I S S S S N C A D
Y D L E V - - - - - - - - - E I S S S S N C - -
TTCCAGAATACTTAC---------------------------TCTTAACCTATTTACTTCAGGTGA------
361362363364365366367368369370371372373374375376377378379380381382383384
F Q S R R S S I R M K S G K N T Q L V H T L N A
- - - - - - - - - - - - - - - - - - V H T L N A
------------------------------------------------------AGATTGCAAAGTACTACG
385386387388389390391392393394395396397398399400401402403404405406407408
S G L A I G R T M A A L L E T G Q Q N D G T V I
S G . A I G R T M A A - - - - - - - - - - - - -
ACGAGA---TAAACTCTTCTGATGCTGAGCAAT---------------------------------------
409410411412413414415416417418419420421422423424425426
L P A I I A P Y F G R D R L V P E H
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_ser_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I D I N L L R D P K T R E L V I E S E K K R F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K N T D N I E E I Y K K D Q L R I K F N F E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N T N K K K N E I K K K I S Q I Y K E N K K E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K E L A K D L I E K L K L I E K S C F E L E V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
V S T L D E E I K K M L K V V G N I L D S S V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V S N N E R D N K L I R Q F R T N R V I Q N K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N Y T E L M Q K Y T H S V A G A K I I G H R G Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F L S G K I A K L G M A L S R Y A I D F L E K Q
- - - - - - - - L G M A L S R Y A I D F L E K Q
------------------------CAAATCTGAATCAACCATTCGTTCGTCCATGTGTAATGCGCTAAGAGG
193194195196197198199200201202203204205206207208209210211212213214215216
G Y T F I Q T P V M M R K D V M S K T A Q I G D
G Y T F I Q T P V M M - - - - - - - - - - - - -
CTGCTCAGATGTAGCAATGAGATACAAATCATC---------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
F D E Q L Y K V E D D L Y L I A T S E Q P L S A
- - - - - - - - - - - - Y L I A T S E Q P L S -
------------------------------------AGGAGTTTGAATAAAAGTGTAACCTTGTTTTTC---
241242243244245246247248249250251252253254255256257258259260261262263264
L H M D E R M V D S D L P K L Y C G Q S L C F R
- - - - - - - - - - - - - K L Y C G Q S L C F R
---------------------------------------CGCAATTTTACCACTCAAAAAATAACCCCTATG
265266267268269270271272273274275276277278279280281282283284285286287288
K E A G A H G K D N S G I F R V H Q F E K I E Q
K - - - - - - - - - - - - - - - H Q F E K I E Q
CCC---------------------------------------------TTCTGTATAATTTTTTTTATTTTG
289290291292293294295296297298299300301302303304305306307308309310311312
F V I C K P E E S K E Y F Y K M I G L S E E F Y
F V I - - - - - - - - - F Y K M I G L S E E F Y
AATAACTCT---------------------------ATTGTCTCTTTCATTGTTACTTACCACAACAGATGA
313314315316317318319320321322323324325326327328329330331332333334335336
K S L D I S Y N V V S I V S G E F N D A A S I K
K - - - - - - - - - - - - - - - - - - - - - - K
ATC------------------------------------------------------------------CAA
337338339340341342343344345346347348349350351352353354355356357358359360
Y D L E A F F P N A D K Y R E L V S C S N C T D
Y D L E A - - - - - - - - - E L V S C S N C - -
TTCAAAACAGCTTTT---------------------------ATCTTTAGCTAACTCTTTTCCTTC------
361362363364365366367368369370371372373374375376377378379380381382383384
Y Q S R E L N V R Y G V L K E N N K K G Y V H M
- - - - - - - - - - - - - - - - - - - - - V H M
---------------------------------------------------------------AAGTTCAAA
385386387388389390391392393394395396397398399400401402403404405406407408
L N S T L C A V Q R T L C C V V E N Y Q Q D D K
L N S T L . A V Q R T L C C - - - - - - - - - -
ATTAAATTTTATTCT---TTGGTCTTTTTTGTAAATCTCTTC------------------------------
409410411412413414415416417418419420421422423424425426427
I I V P E V L R K Y T G F D E I E L N
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Eukaryotes/Cryptosporidium parvum Iowa II/amino acid sequences/Cparvum_ser_aa
Eukaryotes/Cryptosporidium parvum Iowa II/nucleotide sequences/Cparvum_ser_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I D I N R I R V E K G G D Y Q K I A E S E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A R Y K G L E T L E E L V K V D Q K W R E D M F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K L E Q S K K E L N S I S K E I A Q I K K K D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K A D C K D L Q D K S V Q L K K N L P I I E K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A L E T E E V R D K L W H K I G N V L Q P D V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I S N T E D D N L V L R T W G E I P D I K V D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
T P G K L H H N E I M S R L G F Y D S V K G A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L A G H R G Y F L K D Y G V I M S M A L S H Y A
- - - - - - - - - - - - - - - M S M A L S H Y A
---------------------------------------------ATGAGTATGGCTCTCTCACATTATGCT
193194195196197198199200201202203204205206207208209210211212213214215216
M G F L L K K G Y L A I Q P P Y F M K R D L M G
M G F L L K K G Y L A I Q P P Y F M - - - - - -
ATGGGATTCTTGTTAAAAAAAGGATATTTGGCAATTCAACCGCCATACTTTATG------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K A A E L Q D F E E T L Y H I P S D N S K G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
D S N S L F L I A T S E Q P I A A M H H N V T L
- - - - - F L I A T S E Q P I A - - - - - - - -
---------------TTTTTGATTGCAACATCTGAGCAACCAATAGCT------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E D K D L P I K Y A G I S T C F R K E A G A H G
- - - - - - I K Y A G I S T C F R K - - - - - -
------------------ATCAAATATGCTGGTATTTCAACATGCTTTAGAAAA------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K D T W G I F R I H Q F E K V E Q F C V T L P E
- - - - - - - - - H Q F E K V E Q F C V - - - -
---------------------------CATCAATTTGAAAAAGTTGAGCAATTCTGTGTT------------
313314315316317318319320321322323324325326327328329330331332333334335336
D S Q K I H E E M I S I S E E F Y Q S L E L P Y
- - - - - H E E M I S I S E E F Y Q - - - - - -
---------------CATGAGGAAATGATTAGCATTTCCGAGGAATTTTATCAA------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V I S I V S G A L N D A A S K K Y D L E A W F
- - - - - - - - - - - - - - - - K Y D L E A - -
------------------------------------------------AAGTATGATTTAGAAGCT------
361362363364365366367368369370371372373374375376377378379380381382383384
P G Y N S Y R E L V S C S N C T D Y Q S R A L E
- - - - - - - E L V S C S N C - - - - - - - - -
---------------------GAACTTGTTTCATGCTCAAACTGT---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
C R L G F R K E G E R E K H Y C H F L N G T L C
- - - - - - - - - - - - - - - C H F L N G T L .
---------------------------------------------TGCCATTTCCTAAACGGTACTTTA---
409410411412413414415416417418419420421422423424425426427428429430431432
A I Q R T M C C I V E N Y Q T P D G L R I P K V
A I Q R T M C C - - - - - - - - - - - - - - - -
GCAATCCAAAGAACAATGTGCTGT------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454
L Q P Y M N G V E F I P F K N E T A T C A N
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Archaea/Methanothermobacter thermautotrophicus/amino acid sequences/Mthermautotrophicus_thr_aa
Archaea/Methanothermobacter thermautotrophicus/nucleotide sequences/Mthermautotrophicus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I L L I H S D Y L K Y E T K N K T G I A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I P E D K M Q G D F R E S L V V F T A V E A E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E D N P E S V I E N A V N E I I K V F N D V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
E N V V I Y P Y A H L S S S L S S P K T A V E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E G M E S A L R S E G V D V S R V P F G W Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
A F K I S C K G H P L S E L S R S I R P Q P P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V E E E S E E S E W F I L H R G E T V K P G D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E F K N R D L E N L V K Y E L G E L E S S G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P P H V R L M R E K G L A D Y E P S A D V G H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R W Y P R G R L I R D L L A D Y V Y M L V T S E
- - - - - - - - I R D L L A D Y V Y M L V T S E
------------------------ATAAGGGACCTTCTTGCAGACTACGTCTACATGCTTGTCACCAGTGAG
241242243244245246247248249250251252253254255256257258259260261262263264
G A M P V E T P I M Y D L E D E A I R V H A E K
G A M P V E T P I M Y - - - - - - - - - - - - -
GGGGCAATGCCAGTTGAGACACCCATAATGTAT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F G E R Q Y R M K N R K E L M L R Y A C C F G A
- - - - - - - - - - - - - - M L R Y A C C F G A
------------------------------------------ATGCTGAGATACGCCTGCTGTTTCGGAGCC
289290291292293294295296297298299300301302303304305306307308309310311312
F R I L S D S F L T W K N L P A S I Y E L S T Y
F - - - - - - - - - - - - - - A S I Y E L S T .
TTC------------------------------------------GCATCCATATATGAACTCTCGACC---
313314315316317318319320321322323324325326327328329330331332333334335336
S F R L E K K G E V V G L K R L R G F T M P D L
S F R L - - - - - - - - - - - - R G F T M P D L
AGCTTCCGGCTT------------------------------------AGGGGCTTTACAATGCCGGATCTC
337338339340341342343344345346347348349350351352353354355356357358359360
H T V C A D L D Q S L E E F A R Q V E M C M R T
H T V - - - - - - - - - - F A R Q V E M C M R T
CACACGGTA------------------------------TTCGCCAGGCAGGTCGAGATGTGCATGAGGACC
361362363364365366367368369370371372373374375376377378379380381382383384
G Q D L Q V N Y E V I F R A T A D F Y E E Y R E
G Q - - - - - - - - - - - - - - - - - - - - - -
GGCCAG------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
W V H E V A D K I G K P V L L E I L P S R K H Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
W I A K M D F A A I D Y L G R P I E N P T V Q I
- - - K M D F A A - - - - - - - - E N P T V Q I
---------AAGATGGACTTCGCAGCC------------------------GAGAATCCAACAGTTCAGATT
433434435436437438439440441442443444445446447448449450451452453454455456
D V E S G E R F G I T Y V N S D E E E V N P I I
D - - - - - - - - - - - - - - - - - - - - P I I
GAC------------------------------------------------------------CCAATAATC
457458459460461462463464465466467468469470471472473474475476477478479480
L H C S P T G S I E R V I C S L L E K T A I E M
L H C S P . . S I E R V I C S - - - - - - - - -
CTCCACTGCAGTCCA------AGCATTGAGAGGGTCATATGCAGC---------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
D E K P P M L P L W L S P T Q V R V L P I A E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
H M E Y A S D L V S E L I A A D V R A D L D D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S E T L G K K I R N A A Q D W V P Y V V V I G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
S E M E G K L T V N V R E T G E K L Q M G L D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L I E R I R A E T E G M P F R R L P L P V K L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605
E R I N F
- - - - -
---------------
Class II
Archaea/Thermoplasma volcanium/amino acid sequences/Tvolcanium_thr_aa
Archaea/Thermoplasma volcanium/nucleotide sequences/Tvolcanium_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P I N E I R V Q K G Q R Y R D A I N D K K V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A V K K G D K F L D L D E I A G E D E A V Q P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
Y L D S E D G L Y I L R H S A A H L L A N A V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N L F P E A L P N T G P V V E N G F Y Y D F D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K P I T E E D L S K I E E E M K R I V K E N V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I R R M I Y S K D E L L K I F S K N P Y K I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I N E N V E G K S S V Y Q Q G N F V D L C L G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H V P S T G Y I K A F K L L S I A S A V Y K Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S K N L V R I Y G T A F P D E K S L R R Y L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N L E E A K K R D H R K I I A E M D L A V F N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E W A P G F P M Y T P N G Q I I R K E L I K Y M
- - - - - - - - - - - - - - - I R K E L I K Y M
---------------------------------------------GCTTAGATCAAAGGCCATTTCTATGTT
265266267268269270271272273274275276277278279280281282283284285286287288
D Y V N G K N G W T D V W T P H V F K D T I W K
D Y V N G K N G W T D V W T P H V F - - - - - -
TCCGAATACAGTAGTAAAGGTCTCCCTGACCATGCCAAGCAGAGTCTTTATCTC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q S G H Y A K Y K P N M Y L F V L P D G D S Y G
- - - - - - - - - - - - - - - - - - - - - - - G
---------------------------------------------------------------------CTT
313314315316317318319320321322323324325326327328329330331332333334335336
I K P M N C P G H I A I F A R R K Y S Y R D L P
I K P M N C P G H I - - - - - - - - - - - - - -
CTCGTACCTGTAAACAGTACCCGGCTCTGA------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V K Y S E P G T V Y R Y E K S G E V G G L T R P
V K Y S E P G T V Y R Y - - - - - - - - - - - -
AAATATTGCTATATGGCCCGGGCAGTTCATTGGCTT------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A F T Q D D G H E F I R M D Q I V G E I K T L
R A F T Q D D G H E F - - - - - - - - - I K T L
ATACATGTTCGGTTTGTACTTTGCATAGTGCCC---------------------------CACATGGGGAGT
385386387388389390391392393394395396397398399400401402403404405406407408
L G M V R E T F T T V F G N I E M A F D L S V I
L G M V R E T F T - - - - - - - - - - - - - - -
CCAAACGTCAGTCCAGCCGTTCTTTCC---------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D K E H P E N Y L L S Y V C K D C G N R V E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R G T D I E C P V C H S H N M D P D F S T W D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A T E Q L R Q A M D S M G I T Y K E Y P G E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F Y G P K I D V H V K D A L G R M W Q L S T I Q
- - - - K I D V H V - - - - - - - - Q L S T I Q
------------CTTTATGTATCCGGTTGA------------------------ATCTACAAAGTTTCCCTG
505506507508509510511512513514515516517518519520521522523524525526527528
V D F F M P I N F G L T Y T N S E G K E E R V V
V D - - - - - - - - - - - - - - - - - - - - V V
CTGGTA------------------------------------------------------------AAAAAT
529530531532533534535536537538539540541542543544545546547548549550551552
I I H R A I Y G S Y E R F M A I L L E H F A G K
I I H R A I . . S Y E R F M A I - - - - - - - -
CTTCAGCAATTCATCTTT------TATCATTCTCCTTATTGGGACATT------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L P T W L T P I Q T Y V I P V G T A N A E Y A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
K V N K S L L D A G I R S V V D D G P D T V S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K I K M I H D Q R P S Y I V V V G A K E E Q D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
T V T V R N R A G K S K T Y G M N E F L E I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660
N E I E K R S V G Q A F
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Methanococcus aeolicus Nankai/amino acid sequences/MaeolicusNankai_thr_aa
Archaea/Methanococcus aeolicus Nankai/nucleotide sequences/MaeolicusNankai_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K V L L I H S D Y L E F E A K Q K T K I A E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T D I L N G K M E E C L T V F M A V E K E D E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N P Q N V I Y N T V D E I I K T A E N L K I N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V V Y P Y A H L S S E L S S P K V A K E V L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I E E E L K Q K N Y S V L R A P F G W Y K S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K I S C K G H P L S E L S R K I T T E R K E E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G E T E A K D R P K N K F Y I L D G E K G E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L K E L D E K K V K K L K D K G L K S V A M H E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
M G I K H G G K E K D I E P P H V K F I T E K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I C D Y E P S S D A G H F R W Y P K G K L I R D
- - - - - - - - - - - - - - - - - - - - - I R D
---------------------------------------------------------------TTCAAAGAA
241242243244245246247248249250251252253254255256257258259260261262263264
L L Q D Y V Y N M V V E N N G M P V E T P V M Y
L L Q D Y V Y N M V V E N N G M P V E T P V M Y
ATCCTCTGTAAATCTAAATATTGTAGAATATGGCGTATTAAGGTCATCTCCTGTTTTTAAGCACATCCAGAA
265266267268269270271272273274275276277278279280281282283284285286287288
D L G N K A I K E H A D K F G E R Q Y R F K Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
N K D L M L R F A A C F G Q F M M K K D M Y I L
- - - - M L R F A A C F G Q F - - - - - - - - -
------------TAATCCTACGAGCTCCCCTCTTTGTTCATATCT---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P K H L P L K L Y E L S T Y S F R Y E Q R G E L
- - - - - L K L Y E L S T . S F R Y - - - - - -
---------------TTTTGGAAGTATGTACATATCCTT---CATCATAAATTG------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V G L K R L R G F T M P D M H T V C K D T K Q T
- - - - - - R G F T M P D M H T V - - - - - - -
------------------GTTTCCCTGTTTAAATCTGTACTGTCTTTCTCC---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
I E E F E N Q F W M C L K T G D D L N T P Y S T
- - - F E N Q F W M C L K T G D - - - - - - - -
---------ATTTCCCAAATCATACATTACAGGTGTTTCAACAGGCAT------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I F R F T E D F F E E N K E W F F K V A K E Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E K Y G K D V I L E L I P E R K H Y W V G K V D
- - - - - - - - - - - - - - - - - - - - - K V D
---------------------------------------------------------------CTTTTCTTT
433434435436437438439440441442443444445446447448449450451452453454455456
M A V I D S F G R P I E N P T V Q I D V E S A K
M A V - - - - - - - - E N P T V Q I D - - - - -
ACCTCCATG------------------------TACGGATTTTAAACCTTTATCTTT---------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F N I V V H D G N E K T Y P V I L H C S P T G
- - - - - - - - - - - - - - P V I L H C S P . .
------------------------------------------ATCAAGGATGTAGAATTTATTTTT------
481482483484485486487488489490491492493494495496497498499500501502503504
S I E R V L C G L L E K A S L D A D A G A P P M
S I E R V L C G - - - - - - - - - - - - - - - -
GTCTTTTGCCTCCGTTTCTCCTTT------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L P V W L S P I Q A R V I P V A D A H S E Y A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S V A K K L R E N G I R A D F D D R E E S V G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K I R N A G K D W V P F V I V I G D K E V E N N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I L T T T I R E K S T L K K P V K E N L T V E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L I E K I K E E T K G F P Y R P L S L P L Y C S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630
L Q P I F R
- - - - - -
------------------
Class II
Archaea/Sulfolobus acidocaldarius/amino acid sequences/Sacidocaldarius_thr_aa
Archaea/Sulfolobus acidocaldarius/nucleotide sequences/Sacidocaldarius_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E S Y K E V W L K A G L I Y A L N L L S S G N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K P V E I G L G E R Y F Y V D I D S P D I L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
L D E A K D F A K Y N Q Y D Y Q L V E D N Q G S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I T V V Y N G H Q I R L N G G K P N Q N V H P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y F Q I L S I S V H H P S P E K Q Y V R V L G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G F E K E E Q L K D Y L N W L E K V S E Y D H R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I I G D R L D L F S F P E E A P P G V V L F H P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N G Q I I R K E M M R F M E E I N D S M G Y K E
- - - - I R K E M M R F M E E I N D S M G Y K E
------------GGATAAACTATCTCTGATGTCGAAATCTATTTTAGGACCATAAAATGCCCCCTCTTTTTC
193194195196197198199200201202203204205206207208209210211212213214215216
V Y T S H V Y R S L L W K I S G H Y D Y Y K D K
V Y T S H V Y - - - - - - - - - - - - - - - - -
TTTGACTTCATACCTAATGTT---------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M L L F E I D N D E E L G I K P M N C P A H I L
- - - - - - - - - - - - G I K P M N C P A H I -
------------------------------------ATTTACTCTGACATCATCTCCCTTGAAACCAAA---
241242243244245246247248249250251252253254255256257258259260261262263264
I Y K S K V R S Y K D L P I R F S E F G H V Y R
- - - - - - - - - - - - - I R F S E F G H V Y R
---------------------------------------TTCGTCCTTAATTTGATCTTCTCTAAGAAAGAT
265266267268269270271272273274275276277278279280281282283284285286287288
W E K K G E L Y G L L R V R G F T Q D D G H I F
W - - - - - - - - - - - - R G F T Q D D G H I F
ATG------------------------------------ACCATACAATTCACCTTTCTTCTCCCACCTATA
289290291292293294295296297298299300301302303304305306307308309310311312
L R E D Q I K D E I K L L M K K T L D V L A I F
- - - - - - - - - I K L L M K K T L D V L A - -
---------------------------AGGTAAATCCTTATAACTTCTGACCTTACTCTTGTAAAT------
313314315316317318319320321322323324325326327328329330331332333334335336
G F K G D D V R V N L S T R P D E S I G T D E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
W N K A T D A L I S A L N E L N I R Y E V K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E G A F Y G P K I D F D I R D S L S R W W Q L S
- - - - - - - K I D F D I - - - - - - - - Q L S
---------------------CTCTTCCATGAATCTCAT------------------------ATTTGGATG
385386387388389390391392393394395396397398399400401402403404405406407408
T I Q V D F N L P E R F K L E Y V D K D G S K K
T I Q V D - - - - - - - - - - - - - - - - - - -
AAACAGAACAACTCC---------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
R P V M V H R A I Y G S I D R F M A I L L E H F
- P V M V H R A I . . S I D R F M A I - - - - -
---GTATTCTGATACTTTCTCTAACCA------ATAATCCTTTAATTGTTCCTCCTT---------------
433434435436437438439440441442443444445446447448449450451452453454455456
R G K L P T W L S P I Q V R V L P I T D E I E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
Y G N S L M S R L R E S K I R V D M D S G E E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L S K R I K K A Y D D G V P Y L I I V G R K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D E G K V T V R A R G N I E I R G I N V E K F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549
Q A L V E E I R N K D L N Q S A V S K L K
- - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------
Class II
Archaea/Methanopyrus kandleri/amino acid sequences/Mkandleri_thr_aa
Archaea/Methanopyrus kandleri/nucleotide sequences/Mkandleri_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R L L F I H A D E M S F E A R Q K T K I A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P P I K E A E V E D C L V V F A A V Q E A D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E N P K A I A E A A V E E I E D V A G E L K A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R I V L Y P Y A H L A D D L A S P D V A V E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K R M E G L L K E R G Y E V V R A P F G W Y K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F R L A C K G H P L S E L S R T V T P E A A E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A E E E K I E S E F L V Y M D G E L I P V E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D L S E L P E D F R H L V M H E L G E E R E T G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
D E E P A H V K L M R E K E I C D H E P A A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G H V R W Y P K G H V V R R C L A E Y V E N L M
- - - - - - - - - - - V R R C L A E Y V E N L M
---------------------------------GTCAGGAGATGCCTGGCGGAGTACGTGGAGAACCTCATG
241242243244245246247248249250251252253254255256257258259260261262263264
A D L G A A V V E T P V M Y D L S E D A I R E H
A D L G A A V V E T P V M Y - - - - - - - - - -
GCCGATCTAGGAGCGGCGGTCGTCGAGACACCCGTGATGTAC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A D K F G E R Q Y R I R A G N R A L M L R Y A A
- - - - - - - - - - - - - - - - - - M L R Y A A
------------------------------------------------------ATGCTGAGGTACGCGGCC
289290291292293294295296297298299300301302303304305306307308309310311312
C F G A F R L L A D T T L S R R H L P L K I Y E
C F G A F - - - - - - - - - - - - - - L K I Y E
TGCTTCGGAGCCTTC------------------------------------------TTGAAGATCTACGAA
313314315316317318319320321322323324325326327328329330331332333334335336
L S Q S F R L E Q S G E V V G L K R L R A F T M
L S Q S F R L - - - - - - - - - - - - R A F T M
CTATCACAAAGCTTCAGGTTA------------------------------------CGGGCGTTCACTATG
337338339340341342343344345346347348349350351352353354355356357358359360
P D L H T V C A D M D E A V E E F L E Q A K L C
P D L H T V - - - - - - - - - - F L E Q A K L C
CCCGATCTCCACACCGTT------------------------------TTCCTCGAGCAAGCGAAACTATGC
361362363364365366367368369370371372373374375376377378379380381382383384
L E V G L D L G L E Y E V V F R T T E K F L K E
L E V G L - - - - - - - - - - - - - - - - - - -
TTGGAGGTAGGGCTG---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R K E V L E E L A E A M E K A Y G D A K P V L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E V L P E R K H Y W E C K V D F A F I D S L G R
- - - - - - - - - - - - K V D F A F - - - - - -
------------------------------------AAGGTGGACTTCGCGTTC------------------
433434435436437438439440441442443444445446447448449450451452453454455456
P I E N P T V Q I D V E S G R R F G I T Y A D E
- - E N P T V Q I D - - - - - - - - - - - - - -
------GAGAACCCGACGGTACAGATCGAC------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
S G D E R H P V I L H C S P T G S L E R V I C A
- - - - - - P V I L H C S P . . S L E R V I C A
------------------CCAGTGATATTACACTGCTCACCG------AGCCTTGAACGTGTAATATGCGCG
481482483484485486487488489490491492493494495496497498499500501502503504
I L E G Q Y K R F E Q E G K L P T L P T W L S P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V Q A R V I P V S E K V L E E A E K V F E E L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S E G F R V D L D D R D E P V G R K I R D A G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E W V P Y V I V I G E E E V K K G T L S V T I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E E S T L K E Q R R E E M T L E E L V E R L E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E T E G K P R V P L T I P D R L S R R P R F G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Methanospirillum hungatei/amino acid sequences/Mhungatei_thr_aa
Archaea/Methanospirillum hungatei/nucleotide sequences/Mhungatei_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R L L L I H S D F I E Y E A K K K T K F A E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P C N P A D R L D D A L V A F C A V E S P D A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D I D D V I C Q T V T A I G E M A G K V E C N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V M V Y P Y A H L S S D L A A P D L A V A A L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I E E S L E K A G Y E V K R A P F G W Y K S F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S L S C K G H P L S E L S R S I T P S E D A V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P E K K H I E H K F F V L T P E G T I H D V Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Y M D D S P F A A L I K K E I G T A V P V G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P V H V D L M R S K E F V D Y E P V S D V G H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R W L P R G K L V R D L L A D Y A L S L V L D Y
- - - - - - - - V R D L L A D Y A L S L V L D Y
------------------------GATCCAGCCTTCATACTCTGAATAGAATTCCTCAGTGCAGCGGAATAC
241242243244245246247248249250251252253254255256257258259260261262263264
G A S P V E T P V M Y D L A D K A I F E H A D K
G A S P V E T P V M Y - - - - - - - - - - - - -
TGCAACCAGCTGGGTCCCGAAGTCACGCCCGGT---------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
F G E R Q Y R F K S G N R N M M L R F A A C F G
- - - - - - - - - - - - - - - M L R F A A C F G
---------------------------------------------AAAAGCACGAAGTCTTTTCAGACCAAT
289290291292293294295296297298299300301302303304305306307308309310311312
M F T T M R S M H I S P N H L P M K M Y E L S T
M F - - - - - - - - - - - - - - M K M Y E L S T
AACCTC------------------------------------------CATCTTCATCGGCAGATGGTTTGG
313314315316317318319320321322323324325326327328329330331332333334335336
Y S F R H E Q K G E V I G L K R L R A F T M P D
. S F R H - - - - - - - - - - - - R A F T M P D
---GATATGCATACT------------------------------------TCGGAGCATCATGTTGCGGTT
337338339340341342343344345346347348349350351352353354355356357358359360
M H S L C K D L E N A L T C F E E Q L A I G W K
M H S L - - - - - - - - - - F E E Q L A I G W K
ACCTGATTTGAA------------------------------GTGTTCAAAGATGGCTTTATCAGCAAGATC
361362363364365366367368369370371372373374375376377378379380381382383384
T G R D F G T Q L V A V F R C T E E F Y S E Y E
T G R - - - - - - - - - - - - - - - - - - - - -
ATACATGAC---------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
G W I K K I V K D S G V P I L I E T L S D R V H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y W I A K I D L A A I D G Q N R P I E N P T V Q
- - - - K I D L A A - - - - - - - - E N P T V Q
------------CATCAGATCAACATGGAC------------------------GGTCCCGATCTCCTTTTT
433434435436437438439440441442443444445446447448449450451452453454455456
I D V E S S K R F G I K Y H L A D G T E V Y P P
I D - - - - - - - - - - - - - - - - - - - - P P
TATAAG------------------------------------------------------------AAGAAC
457458459460461462463464465466467468469470471472473474475476477478479480
I L H C S P T G S V E R V F C A I L E N T V N Q
I L H C S P . . S V E R V F C A - - - - - - - -
AAAGAATTTATGTTCAAT------CTTCTCAGGTTTTACCGCATCTTC------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
K V A H L P T W L T P T Q V R I I P V T D N H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
G Y A K D I A E K L T K A R I R A D I D D R D D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S L N K K I R A A G M D W V S Y V I V V G D S E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
M N S G N L T V T V R S E S E P N K P Q K I T C
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
T A E K L I E M I G K E T S G K P F R P L Y T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610
R M L S L K P R Y I
- - - - - - - - - -
------------------------------
Class II
Archaea/Archaeoglobus fulgidus/amino acid sequences/thr_Arc_A_fulgidus
Archaea/Archaeoglobus fulgidus/nucleotide sequences/Afulgidus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K L L L I H A D Y M E Y E V K K K T K L A E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
F D G K G E R V E E V L V A F T S V E K G D D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N V V R K A A E A I R E V A E K V N A E R I M I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y P Y A H L S S N L A D A E T A V K L L K Q L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E L S D F E V H R S P F G W Y K A F R I S C K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G H P L S E L S R E I G G E A E A E V T Q A L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D E E E K V V S Y W Y I L T P E K E L V E V E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F D F T G Y E R L R K F V N Y E I A K R R A V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
V T P P H V E Y M R R L E L A D Y E P A S D S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
H I R Y Y P K G R L V K T L L E Q F I T R K C I
- - - - - - - - - - V K T L L E Q F I T R K C I
------------------------------GTGAAAACGCTCCTTGAGCAGTTCATAACGAGAAAGTGCATT
241242243244245246247248249250251252253254255256257258259260261262263264
D Y G A M E V E T P I M Y D R N H P T L R R Y L
D Y G A M E V E T P I M Y - - - - - - - - - - -
GACTATGGCGCCATGGAGGTTGAAACTCCCATCATGTAC---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E R F P A R Q Y I I K G D K R E F F L R F A A C
- - - - - - - - - - - - - - - - - F L R F A A C
---------------------------------------------------TTTTTGAGGTTTGCCGCTTGC
289290291292293294295296297298299300301302303304305306307308309310311312
F G Q F L M L S N S T I T Y R N L P L K I Y E L
F G Q F - - - - - - - - - - - - - - L K I Y E L
TTCGGTCAGTTT------------------------------------------CTGAAAATCTACGAGCTC
313314315316317318319320321322323324325326327328329330331332333334335336
T R Y S F R K E Q R G E L V G L R R L R A F T M
T R . S F R K - - - - - - - - - - - - R A F T M
ACCCGC---TCCTTCAGGAAG------------------------------------AGAGCCTTTACGATG
337338339340341342343344345346347348349350351352353354355356357358359360
P D M H T V A K D M E Q A K E E F F N Q Y R L S
P D M H T V - - - - - - - - - - F F N Q Y R L S
CCCGATATGCATACGGTG------------------------------TTTTTCAACCAGTACCGCCTGTCG
361362363364365366367368369370371372373374375376377378379380381382383384
V E V L R E I G L E P E D Y E V A V R I T K D F
V E V L R - - - - - - - - - - - - - - - - - - -
GTGGAGGTTCTGAGG---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y E E N R E F V H S L V D I L Q K P I L I E M W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D H R F F Y F V L K F E F N F V D A L D K A S A
- - - - - - - - - K F E F N F - - - - - - - - A
---------------------------AAATTCGAGTTCAACTTT------------------------GCC
433434435436437438439440441442443444445446447448449450451452453454455456
L S T V Q I D V E N A E R Y G I T F V D S D G K
L S T V Q I D - - - - - - - - - - - - - - - - -
CTCTCAACTGTGCAGATTGAT---------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E K H P Y I L H C S V S G A V E R V M Y A L L E
- - - P Y I L H C S V . . A V E R V M Y A - - -
---------CCCTACATTCTGCACTGCTCCGTC------GCGGTGGAGAGGGTGATGTATGCA---------
481482483484485486487488489490491492493494495496497498499500501502503504
K A K F M L D E G M L P M L P V W L S P T Q V R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V I P V S E R F V D A A I K I A D D I A R N G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R V D V D D R N E T L G K K I R D A Q T E W I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y I A V V G E K E I E S G K L A V T V R A E S T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Q K E Q K R V E M S A E E L A K R V R A E C E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619
K P F M P L P L P K L L S L R P S F R
- - - - - - - - - - - - - - - - - - -
---------------------------------------------------------
Class II
Archaea/Pyrobaculum aerophilum/amino acid sequences/Paerophilum_thr_aa
Archaea/Pyrobaculum aerophilum/nucleotide sequences/Paerophilum_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V L Y I H A E R F N W E P R D P A L D I R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E P T S G N A N N A L V V F T S V E R G D V P D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E N F L R A V A S D I I D V A K K V K A S A I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I Y P Y A H L S S D L A R P Y T A R E V L N K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F E V V K S Q F N G E V L K A P F G Y Y K A F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I K C L G H P L S E L S R S F K P E E G R A D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R A E E R R D Y Y V I I T P N G E E H D P A K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N Y A N Y G D L K A L V E K E V F R K E L G G G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E P K Y L E Y L R K F G F E W E P M S D A G H M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
R Y A P E A T V M M E L V E D Y S Y I V A K S L
- - - - - - - - M M E L V E D Y S Y I V A . . L
------------------------ATGATGGAGCTAGTGGAGGACTATTCCTATATCGTCGCT------CTT
241242243244245246247248249250251252253254255256257258259260261262263264
G I P V F K I R G T N M F K L S E K A I E S H A
G I P V F K I R G T N M F - - - - - - - - - - -
GGCATACCCGTATTTAAAATTAGGGGCACCAATATGTTT---------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
R L F G E R L Y I V E S D T D L I L R Y A A C F
- - - - - - - - - - - - - - - - I L R Y A A C F
------------------------------------------------ATACTTAGATACGCCGCGTGTTTT
289290291292293294295296297298299300301302303304305306307308309310311312
Q Q F A M A K D W V I S Y K H L P F G M L E I A
Q Q F - - - - - - - - - - - - - - F G M L E I A
CAACAATTC------------------------------------------TTTGGAATGCTGGAAATAGCT
313314315316317318319320321322323324325326327328329330331332333334335336
D S Y R H E Q P G E T V L L F R L R R F Y M P D
D S Y R H - - - - - - - - - - - - R R F Y M P D
GATTCATACCGCCAC------------------------------------AGGCGTTTTTATATGCCAGAT
337338339340341342343344345346347348349350351352353354355356357358359360
L H I F T K D L K E A M E V T Y K L H E V I F R
L H I F - - - - - - - - - - T Y K L H E V I F R
CTCCATATTTTC------------------------------ACTTACAAGCTCCACGAAGTAATTTTTAGA
361362363364365366367368369370371372373374375376377378379380381382383384
E I G K L G R T Y V S L Y N V T E G F Y K N H R
E I G - - - - - - - - - - - - - - - - - - - - -
GAAATTGGC---------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D Y L V E L A R R E G K P I L V R V L P G Q K Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
Y W V L N V E F H I V D E L G R P R E I A T F Q
- - - - N V E F H I - - - - - - - - E I A T F Q
------------AACGTGGAGTTCCACATA------------------------GAGATAGCCACTTTCCAA
433434435436437438439440441442443444445446447448449450451452453454455456
I D V G N A Q R F G I K Y V D E N N Q I K Y P V
I D - - - - - - - - - - - - - - - - - - - - P V
ATAGAC------------------------------------------------------------CCAGTT
457458459460461462463464465466467468469470471472473474475476477478479480
I I H T A I L G S V E R Y L Y A V F D T M A K M
I I H T A I . . S V E R Y L Y A - - - - - - - -
ATAATCCACACGGCAATT------AGCGTGGAGAGATACCTCTACGCC------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E K E G K V P R L P T W L S P V Q V R V I P V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K E N L K Y A I S I A D V L E A E G I R V D I D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
D R E E T L S K K I R D A E T S W I P Y I V V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
G S K E E A E G V I A V R E R G G G Q Y K I R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E E L V K K L K D E T R G Y P Q R P L Y L P R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608
L S Q R P S R F
- - - - - - - -
------------------------
Class II
Archaea/Thermoplasma acidophilum/amino acid sequences/Tacidophilum_thr_aa
Archaea/Thermoplasma acidophilum/nucleotide sequences/Tacidophilum_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P D S I V H V K K G Q R F L D V I K D K N V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A V K I D S V L H D L R D V A E R D V D A I P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
S V Y S D D G L Y I L R H S A A H L L A N A V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N L Y P D A L P N T G P V V E N G F Y Y D F D M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K P I G E E D L A K I E D E M R R I Q K E N V P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E R I V Y Q K A D L L R I F A K N P Y K I R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I E D N V S D A S S V Y R Q G N F V D L C L G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
H V P S T G Y I K A F K L L N I A S A V Y K H D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E S K T L V R I Y G T A F P D E K L L K Q Y L N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N L E E A K R R D H R R I I A E M D L A V F N S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E W A P G F P L Y T Q Y G Q T I R K E L L S Y M
- - - - - - - - - - - - - - - I R K E L L S Y M
---------------------------------------------GCTAAGATCGAAGGACAGTTCGATGTT
265266267268269270271272273274275276277278279280281282283284285286287288
D S M N R K N G W F D V W T P H V F R D T I W K
D S M N R K N G W F D V W T P H V F - - - - - -
TCCGAATAAAATGGTGAATACATCCTTGACCATGGTCAGCAGGGTTCTTATCTC------------------
289290291292293294295296297298299300301302303304305306307308309310311312
Q S G H Y A K Y R P N M Y L F T L P D G D S Y G
- - - - - - - - - - - - - - - - - - - - - - - G
---------------------------------------------------------------------TTT
313314315316317318319320321322323324325326327328329330331332333334335336
I K P M N C P G H I A I F S R R K Y S Y R D L P
I K P M N C P G H I - - - - - - - - - - - - - -
TTCGTATCTGTACACGGTTCCAGGCTCGGA------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
V R Y S E P G T V Y R Y E K S G E V G G L T R P
V R Y S E P G T V Y R Y - - - - - - - - - - - -
AAAGATGGCTATGTGGCCAGGGCAGTTCATCGGTTT------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R A F T Q D D G H A F L R M D Q I G D E I R T L
R A F T Q D D G H A F - - - - - - - - - I R T L
GTACATGTTTGGCCGGTACTTGGCATAATGCCC---------------------------GACGTGCGGAGT
385386387388389390391392393394395396397398399400401402403404405406407408
L T M V K D V F T I L F G N I E L S F D L S V I
L T M V K D V F T - - - - - - - - - - - - - - -
CCAGACGTCAAACCATCCATTCTTCCT---------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D R D H P E N Y L V S Y V C R N C G Y R I E G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R G T D I E C P V C H S H D L E P D L S V W D N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A T E Q L R D A L K S M G I E Y K E Y P G E A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
F Y G P K I D V H V K D A I G R M W Q L S T I Q
- - - - K I D V H V - - - - - - - - Q L S T I Q
------------TTTTATATAACCGGTGCT------------------------GTCGACGAAGTTGCCCTG
505506507508509510511512513514515516517518519520521522523524525526527528
L D F F M P V N F G L T Y T N S E G K E D R V V
L D - - - - - - - - - - - - - - - - - - - - V V
CCTGTA------------------------------------------------------------AAATAT
529530531532533534535536537538539540541542543544545546547548549550551552
M I H R A I Y G S Y E R V M A I L L E H Y A G K
M I H R A I . . S Y E R V M A I - - - - - - - -
CCTAAGGAGATCAGCCTT------CACTATCCTCTCTATGGGCACGTT------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L P T W L T P I Q T Y V V P I S S N F D E Y A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
H V H E E L I R H G I R S E I D T S Q E T V S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K I K L I H P Y R P A Y I I V V G S K E M E T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S V T A R N R E G K S K T Y S L S E F I D V V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660
K E I E Q R K V D Q A F
- - - - - - - - - - - -
------------------------------------
Class II
Archaea/Pyrodictium occultum/amino acid sequences/Poccultum_thr_aa
Archaea/Pyrodictium occultum/nucleotide sequences/Poccultum_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R V I L I H A K E F Y Y K A R S K A I A E A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P P E S A P Q E A S A E N A L V A F T T V E D I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D T Q G I N E A V E K A A A D I V N V A E K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A S T I V L Y P Y A H L S Q K L A P P K A A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A M R L L E D M V R S R A S G K F R V I R A P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G W Y K E F R I H C Y G H P L S E L S R T Y T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K A S K K P H V E K K Y Y V L T P E G D V Y E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E Y L E K A D E E L R I L I E K E A L G K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G E V E N P V N K L C A K F G F E W E P M S D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G H M R Y E P H A A L M I E A V S E Y A W K L A
- - - - - - - - - - - M I E A V S E Y A W K L A
---------------------------------ATGATAGAGGCTGTGTCGGAGTACGCGTGGAAGCTGGCA
241242243244245246247248249250251252253254255256257258259260261262263264
R G L G I P V L R I R G T N M F D L A A R P V Y
. . L G I P V L R I R G T N M F - - - - - - - -
------CTGGGTATCCCCGTGCTTCGAATACGTGGCACAAACATGTTC------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H A A L F G D R L Y E L W A D K K H L V M R Y
- - - - - - - - - - - - - - - - - - - - V M R Y
------------------------------------------------------------GTCATGCGCTAC
289290291292293294295296297298299300301302303304305306307308309310311312
A A C H Q Q F A M L K D Y V L S Y K D L P L G M
A A C H Q Q F - - - - - - - - - - - - - - L G M
GCTGCATGCCACCAGCAGTTC------------------------------------------CTAGGCATG
313314315316317318319320321322323324325326327328329330331332333334335336
F E V A D S Y R F E Q S G E V T L C F R L R K F
F E V A D S Y R F - - - - - - - - - - - - R K F
TTCGAGGTAGCTGATAGCTACCGGTTC------------------------------------CGCAAATTC
337338339340341342343344345346347348349350351352353354355356357358359360
Y M P D L H I L T R D V E E A V K V S E K L Q E
Y M P D L H I L - - - - - - - - - - S E K L Q E
TACATGCCCGACCTACATATATTG------------------------------AGCGAGAAGCTGCAGGAA
361362363364365366367368369370371372373374375376377378379380381382383384
V I H R E A A K L G R K Y Y A V Y N V T E D F W
V I H R E A A - - - - - - - - - - - - - - - - -
GTGATACACCGTGAGGCAGCC---------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
S Q K R D L L L E L V R R D G R P A V V A L Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A G I Y Y W V V N V E Y H I V D S V G R P R E I
- - - - - - - - N V E Y H I - - - - - - - - E I
------------------------AACGTCGAGTACCATATA------------------------GAGATA
433434435436437438439440441442443444445446447448449450451452453454455456
A T F Q F D I G N A K R F G I K Y V D E N N Q E
A T F Q F D - - - - - - - - - - - - - - - - - -
GCAACGTTCCAGTTCGAC------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R Y P V I I H T A L I G S V E R Y I Y M V F D T
- - P V I I H T A L . . S V E R Y I Y M - - - -
------CCTGTAATAATCCATACCGCCTTG------TCTGTAGAGAGATACATCTACATG------------
481482483484485486487488489490491492493494495496497498499500501502503504
A V Q M E Q Q G K R P Y I P T W L A P I Q V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I P V D P K S E D Q I A L A S K V A D M L E H N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L I R V D I D D R D I S L G K R I R D A A R E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I P Y I G V I G D R E V K T G T I N V T I R R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N D R V A L K P E E L L D M V L K D I E D Y P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
V Q S T L P R Y V S K R P S L V Y L E R S L E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629
E P G K G
- - - - -
---------------
Class II
Archaea/Staphylothermus marinus/Smarinus_thr_aa
Archaea/Staphylothermus marinus/Smarinus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I L T I H A R K F H Y K A L S Q A L D K P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E L T N E N K E G F F E N V L V V F T S V E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D N E K V V E K A V T E I L D I A N R V K P K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I L L Y P Y A H L S S D L A S P S Q A L E I M K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L L E Q K L R G K T D L E V Y R A P F G W Y K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F M L D C Y G H P L S E L S K T I R I T G G G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
V V R R E L K K E F Y I L T P D G K V Y D P E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F N Y D K Y P D L K I L V D K E V F G K E L P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G V N R V N D Y C R K F G F E W E P M S D H G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
M R Y G P H A V I I M E S I M Q Y S W N I V R S
- - - - - - - - - I M E S I M Q Y S W N I V . .
---------------------------ATAATGGAGTCTATTATGCAGTATTCATGGAATATTGTG------
241242243244245246247248249250251252253254255256257258259260261262263264
L G I P V Y K V M G T N M F N L S E K P V L E H
L G I P V Y K V M G T N M F - - - - - - - - - -
CTAGGAATACCAGTTTACAAGGTTATGGGTACTAATATGTTC------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
A L L F G D R L Y E L K V D N E K F V L R Y A A
- - - - - - - - - - - - - - - - - - V L R Y A A
------------------------------------------------------GTATTAAGATATGCTGCT
289290291292293294295296297298299300301302303304305306307308309310311312
C H Q Q F A M L R D W I I S Y K N L P F G M F E
C H Q Q F - - - - - - - - - - - - - - F G M F E
TGTCATCAACAATTC------------------------------------------TTTGGAATGTTTGAA
313314315316317318319320321322323324325326327328329330331332333334335336
V A D S Y R L E Q R G E L N L C F R L R K F Y M
V A D S Y R L - - - - - - - - - - - - R K F Y M
GTAGCTGATAGTTATCGTCTT------------------------------------AGAAAATTCTATATG
337338339340341342343344345346347348349350351352353354355356357358359360
P D L H I L N R D L N E A I K I S R I V Q D K I
P D L H I L - - - - - - - - - - S R I V Q D K I
CCCGATCTACATATCTTG------------------------------TCACGTATAGTGCAGGATAAGATT
361362363364365366367368369370371372373374375376377378379380381382383384
L E E I A K I G R K Y V A L Y N V T S D F F D K
L E E I A - - - - - - - - - - - - - - - - - - -
CTCGAAGAAATAGCT---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y R D I L I E F V R R E N Y P V L V S V I P S G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I Y Y W V L N V E Y H I I D N L N R P R E I A T
- - - - - - N V E Y H I - - - - - - - - E I A T
------------------AACGTTGAATACCATATT------------------------GAGATTGCAACG
433434435436437438439440441442443444445446447448449450451452453454455456
F Q I D I G N G E R F N I T Y T D E K G E K H H
F Q I D - - - - - - - - - - - - - - - - - - - -
TTTCAGATAGAT------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
P V I I H T A I I G G I E R F I Y T I F D T A A
P V I I H T A I . . G I E R F I Y T - - - - - -
CCAGTAATCATACATACAGCAATT------GGTATTGAGAGGTTCATATATACA------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L M E K E G K T P Y I P T W L A P V Q V R I I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I K N E Y L D Y A E K V A E K I E N A G F R V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I D D R G E S L G K K I R D A G R E W I P Y I V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V I G E R E V R S N T I N V R I R R T N D Q K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
M V T D E L I R I L E E E T K N Y P R V S L T M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614
P K Y L S K R P I P S Y H A
- - - - - - - - - - - - - -
------------------------------------------
Class II
Archaea/Pyrodictium delaneyi/amino acid sequences/Pdelaneyi_thr_aa
Archaea/Pyrodictium delaneyi/nucleotide sequences/Pdelaneyi_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I L L I H A K E F S F K A K S K A I A D A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S V D L T P S E A S V E N A L V V F T T V E D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D T Q N L R E V V E N A V K D I I D V A E K V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A Y T I V I Y P Y A H L S K R L A P P K V A K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A L S L L E E E L K K R A E G K Y K V V R A P F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G W Y K E F K I H C Y G H P L S E L S R A Y A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K A S S K P Q I E K K Y F V L T P N G E V Y K P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
E E Y L S K A D E E F R I L I E K E A L G K E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G E V E N P V N A L C A K F G F E W E P F S D Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G H M R Y E P H A T L M V D A V S E Y A W K L A
- - - - - - - - - - - M V D A V S E Y A W K L A
---------------------------------CGTCACTATGGCTGGTTTTCCGTCACGTTTTATTAACTC
241242243244245246247248249250251252253254255256257258259260261262263264
R D L G I P V L R I R G T N M F D L S A K P V Y
. . L G I P V L R I R G T N M F - - - - - - - -
------TAGATCGCGCTTCTCTTGCCAGAAGTCCTCAGTCACATTGTA------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E H A E L F G D R L Y E L W T D R K H L V M R Y
- - - - - - - - - - - - - - - - - - - - V M R Y
------------------------------------------------------------TATATCACGTGT
289290291292293294295296297298299300301302303304305306307308309310311312
A A C H Q Q F A I L R D Y V L S Y K D L P L G M
A A C H Q Q F - - - - - - - - - - - - - - L G M
TAGTATGTGTAGGTCGGGCAT------------------------------------------TTGCTCTAG
313314315316317318319320321322323324325326327328329330331332333334335336
F E I A D S Y R L E Q S G E V T L C F R L R R F
F E I A D S Y R L - - - - - - - - - - - - R R F
ACGGTAACTATCCGCGATCTCGAACAT------------------------------------ACGCAATAT
337338339340341342343344345346347348349350351352353354355356357358359360
Y M P D L H I L T R D I E E A V N V S R K L Q E
Y M P D L H I L - - - - - - - - - - S R K L Q E
TGCAAACTGTTGATGACAAGCAGC------------------------------CCATAGCTCGTATAGACG
361362363364365366367368369370371372373374375376377378379380381382383384
V I H R E A T R L G Q K Y Y A V Y N V T E D F W
V I H R E A T - - - - - - - - - - - - - - - - -
GTCCCCGAAGAGTTCAGCGTG---------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Q E K R D L L L E L I K R D G K P A I V T V Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A G I Y Y W V V N V E Y H I I D V A G R P R E I
- - - - - - - - N V E Y H I - - - - - - - - E I
------------------------GTAGTCTGAGAAGGGTTC------------------------GAGAGC
433434435436437438439440441442443444445446447448449450451452453454455456
A T F Q F D V G N A K R F G I K Y I D E N N V E
A T F Q F D - - - - - - - - - - - - - - - - - -
ATTGACTGGATTCTCTAC------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R Y P V I I H T A L I G S I E R Y I Y M V L D S
- - P V I I H T A L . . S I E R Y I Y M - - - -
------TTTTGATAAATATTCTTCGGGCTT------TTCGCCATTAGGCGTTAGTACGAA------------
481482483484485486487488489490491492493494495496497498499500501502503504
A V K M E R Q G K K P Y I P T W M A P I Q V R L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I P V D P K S E K Q M Q L V E K T A S L L E E N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L I R V D I D D R D I S L G K R I R D A A R E W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I P Y I G V V G D R E V E T G T I N V T I R R S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N D R I A V K P E E L V A M V L E E I R D Y P R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L Q P T L P R Y V S K R P S F V Y L E K P S T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631
K Q D R A K H
- - - - - - -
---------------------
Class II
Archaea/Nanoarchaeum equitans/amino acid sequences/Nequitans_thr_aa
Archaea/Nanoarchaeum equitans/nucleotide sequences/Nequitans_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R A L F L H S N R I K V I A R Q K A L K E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q L E K P E F D V N K E H L A V F V A V E H G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
N L S V A E Q L V E E I K K V L E K I G I K E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V V V L Y P Y V H L T N N P S S P K L A K E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
D K A Y D L L K S E G F E V Y K A P F G W Y K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F E I H V K G H P L A E L S R T I K P K K V K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E G N K V Y L I Y D G E K E Y I I V G K K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I L V K D Y K E I E N K E K L H F E L P K D G I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E L P I P I N Q D F E K M V L K E V F S E G E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I E K N P L N D V A K K F G F E W E P L S D Y G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H M R Y K P Y A A L M V D L V N D Y S I K I A K
- - - - - - - - - - M V D L V N D Y S I K I A .
------------------------------TTTTTTGTGCATATTTAAGAATTGTTCTACTGCTTCGTC---
265266267268269270271272273274275276277278279280281282283284285286287288
E L P F P V F I V K G T N M F D L K Q G P V A E
. L P F P V F I V K G T N M F - - - - - - - - -
---TTTAGTGAAAACATGCAAATCAGGCATATAGAATTTTCTTAA---------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H A K L F G E R M Y E V Q S D K S V F V L R Y A
- - - - - - - - - - - - - - - - - - - V L R Y A
---------------------------------------------------------AGACAAAGTTAAATC
313314315316317318319320321322323324325326327328329330331332333334335336
A C F Q Q F A I A K D L T L S Y K N V P F G M L
A C F Q Q F - - - - - - - - - - - - - - F G M L
TTTGGCTATAGCGAATTG------------------------------------------GGATTGCACTTC
337338339340341342343344345346347348349350351352353354355356357358359360
E V A D S Y R F E Q P G E V V L A F R L R K F Y
E V A D S Y R F - - - - - - - - - - - - R K F Y
ATACATTCTTTCTCCGAATAGTTT------------------------------------CATGTTAGTGCC
361362363364365366367368369370371372373374375376377378379380381382383384
M P D L H V F T K D L D E A V E Q F L N M H K K
M P D L H V F - - - - - - - - - - F L N M H K K
TTTAACTATAAAAACTGGGAA------------------------------ATCATTAACTAAATCTACCAT
385386387388389390391392393394395396397398399400401402403404405406407408
I M E E I K K I G R D Y E L L I N V A S F E D Y
I M E E I K - - - - - - - - - - - - - - - - - -
TAGAGCAGCATAAGGTTT------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E K Y K Y I I E Q I Y K D V K K P L L L A I Y P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K S D Q R Y W I I N I E Y H I I D V L G R P R E
- - - - - - - - - N I E Y H I - - - - - - - - E
---------------------------TTCTATCCCATCTTTTGG------------------------ATT
457458459460461462463464465466467468469470471472473474475476477478479480
I G T T Q I D L H N S K R F G I K Y I D K D G S
I G T T Q I D - - - - - - - - - - - - - - - - -
CTCAATCTCTTTATAGTCCTT---------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E K H V I I L H N A I L G S I E R Y I Y A L F D
- - - V I I L H N A I . . S I E R Y I Y A - - -
---------ATAGACTTTATTTCCTTCTTCTTT------CTTTTTGGGCTTAATGGTTCTAGA---------
505506507508509510511512513514515516517518519520521522523524525526527528
T A L R K E K P V L P F W I S P V Q V R V I P V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
S E K Y L E Y A E Q I A K E L E S K F R V E L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D R D E T L N K K I K D A E S L W V P Y I I V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G E K E I K N N K I T V R D R Y E N K V Y E T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L E D L I S K M E E L Q K G Y P F R P L Y G P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633
K L S L K P A N L
- - - - - - - - -
---------------------------
Class II
Archaea/Methanosarcina acetivorans/amino acid sequences/Methanosarcina_acetivorans_thr_aa
Archaea/Methanosarcina acetivorans/nucleotide sequences/Methanosarcina_acetivorans_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q L L L I H S D Y I E Y E T K K Q T P V A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I E E S L K S G R L E E A L T A F T A V E S V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A N P E E A I E K A V S E I E K V A A Q V K T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N R I M L Y P Y A H L S S D L S S P K V A V Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L K G I E A A L S G K Y E V K R A P F G W Y K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
F T V S C K G H P L S E L S R S I H P E G T A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A A V K P E A A G E K E E V V S E A L K A E G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A R S Y W R I L T P D G E L H E V E T F D L T P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y P K L Q Q F V N Y E I S K S R A V E R A P P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V E L M R R L E L A D Y E P G S D S G N M R Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
P K G R L V K S L L E N Y V L D V A T E F G A M
- - - - - V K S L L E N Y V L D V A T E F G A M
---------------GTTAAGTCTCTTCTTGAAAACTACGTGCTTGATGTCGCAACCGAGTTCGGGGCAATG
265266267268269270271272273274275276277278279280281282283284285286287288
E V E T P L M Y D M N H P T L K K Y L D R F P A
E V E T P L M Y - - - - - - - - - - - - - - - -
GAAGTCGAAACTCCCCTGATGTAC------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
R Q Y S I E S D K R Q M F L R F A A C F G Q F L
- - - - - - - - - - - - F L R F A A C F G Q F -
------------------------------------TTCCTTCGCTTTGCAGCCTGTTTCGGGCAGTTC---
313314315316317318319320321322323324325326327328329330331332333334335336
M N H D M T I S Y K N L P L R M I E M T R Y S F
- - - - - - - - - - - - - L R M I E M T R . S F
---------------------------------------CTCAGGATGATCGAAATGACCCGT---AGTTTC
337338339340341342343344345346347348349350351352353354355356357358359360
R K E Q R G E L V G L R R L R A F T M P D M H T
R K - - - - - - - - - - - - R A F T M P D M H T
AGAAAA------------------------------------AGGGCTTTTACCATGCCGGATATGCACACC
361362363364365366367368369370371372373374375376377378379380381382383384
L C E D M N Q A V S Q F K E Q Y D L C I D V L E
L - - - - - - - - - - F K E Q Y D L C I D V L E
CTT------------------------------TTCAAGGAACAGTACGACCTCTGCATCGATGTGCTTGAA
385386387388389390391392393394395396397398399400401402403404405406407408
N V G I H I D D Y E V A I R F T R D F Y E S N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E L V V N M A K T V N K P V L V E M W D T R F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
Y F V L K F E F N F V D A L A K A S A L S T V Q
- - - - K F E F N F - - - - - - - - A L S T V Q
------------AAATTCGAGTTTAACTTC------------------------GCCCTTTCCACGGTCCAG
457458459460461462463464465466467468469470471472473474475476477478479480
I D V E N A E R Y D I S Y V N A D G K L E R P I
I D - - - - - - - - - - - - - - - - - - - - P I
ATCGAT------------------------------------------------------------CCGATC
481482483484485486487488489490491492493494495496497498499500501502503504
V L H C S P S G A I E R C I Y A L L E K A A M E
V L H C S P . . A I E R C I Y A - - - - - - - -
GTTCTCCACTGCTCGCCG------GCAATCGAACGTTGTATCTATGCC------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T E E G K V P M L P V W L S P T Q V R I V P I S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E K H L A F A E E V S K K L D C R V D I D D R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L S I G K K V R E A G R E W V P Y V V V I G D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
E M E E G T I N V T V R A E S E Q N K P S K V Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I T P E E L N A R I R G E I A G K P Y R K L P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635
A K Y L S A R P K F F
- - - - - - - - - - -
---------------------------------
Class II
Archaea/Pyrococcus horikoshii/amino acid sequences/Phorikoshii_thr_aa
Archaea/Pyrococcus horikoshii/nucleotide sequences/Phorikoshii_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R I L L I H S D Y I E Y E V K D K A I K N P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
P I S E E E K K G R M D E V L V A F I S V E K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D E T N P E E V V S K A V E E I I N V A S Q V K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A E N V F V Y P F A H L S S E L A K P S V A Q E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I L R K V Y E G L K E K G Y N V G K A P F G Y Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K A F K I S C K G H P L A E L S R T I I P E G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
K E E E V P E A L K K E E T E L V S Y W Y I L T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P E G E L I E V D K F D F T G Y E N L R K F A N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
Y E I S K S R I A E K E P P H V K L M L E H E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V D Y E P G S D P G N L R Y Y P K G R L I K S L
- - - - - - - - - - - - - - - - - - - - I K S L
------------------------------------------------------------ATCAAATCCCTT
241242243244245246247248249250251252253254255256257258259260261262263264
L E Q Y V T E K V I E Y G A M E V E T P V M Y D
L E Q Y V T E K V I E Y G A M E V E T P V M Y -
TTGGAGCAGTATGTGACCGAGAAAGTAATAGAGTATGGAGCTATGGAAGTTGAGACTCCCGTTATGTAT---
265266267268269270271272273274275276277278279280281282283284285286287288
F E H P A L E K Y L N R F P A R Q Y I V L S G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K K Y F L R F A A C F G Q F L I S K D A V I S Y
- - - F L R F A A C F G Q F - - - - - - - - - -
---------TTCCTAAGGTTTGCAGCATGTTTTGGACAGTTC------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
R H L P L R M Y E L T R Y S F R R E K R G E L S
- - - - L R M Y E L T R . S F R R - - - - - - -
------------CTAAGAATGTATGAACTAACTAGG---TCCTTTAGAAGA---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G L R R L R A F T M P D M H T L A K D L E Q A K
- - - - - R A F T M P D M H T L - - - - - - - -
---------------AGGGCCTTCACAATGCCCGACATGCATACACTT------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
D E F K K Q F K L S M E V L K G V G L T P E D Y
- - F K K Q F K L S M E V L K - - - - - - - - -
------TTTAAGAAGCAGTTCAAGCTTAGTATGGAGGTTCTTAAA---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
E V A I R F T E D F W K E N R D F I V E L V K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I G K P V L I E M W K Q R F F Y F I L K F E F N
- - - - - - - - - - - - - - - - - - - K F E F N
---------------------------------------------------------AAGTTCGAATTCAAC
433434435436437438439440441442443444445446447448449450451452453454455456
F V D N L D K A A A L S T V Q I D V E N A E R F
F - - - - - - - - A L S T V Q I D - - - - - - -
TTC------------------------GCCTTAAGCACGGTACAGATTGAC---------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G I K Y Y D E N G E E K Y P L I L H C S P S G A
- - - - - - - - - - - - - P L I L H C S P . . A
---------------------------------------CCCCTAATCCTTCACTGCTCTCCG------GCT
481482483484485486487488489490491492493494495496497498499500501502503504
I E R V M Y A I L E K Q A K L M Q E G K K P M L
I E R V M Y A - - - - - - - - - - - - - - - - -
ATCGAGAGGGTTATGTACGCT---------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P L W L S P I Q V R V I P V S E E Y L D Y A L Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I A G K L E G A R I R V D V D D E D E R L N K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I R R A E K E W I P Y I V V V G A K E K E S G T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I T V R R R E D G K Q Y E T R L E E L I K E I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E K V E G F P Y K P R P L P L L L S K R P K F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625
G
-
---
Class II
Archaea/Rhodothermus marinus/amino acid sequences/Rmarinus_thr_aa
Archaea/Rhodothermus marinus/nucleotide sequences/Rmarinus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M Q T G V K M A G N G Q Q R E V I R I T F P D G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
S E R T F P K G I T G R E L A E Q I S P R L A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E A L A I K V N G E V W D L T R P I E E D A R V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R I L T W E D P E G K A V Y W H S T A H L M A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A L E A L Y P G V K F G I G P P I E Q G F Y Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V D L G G R K L S A E D L A R I E E K M R E L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
R R D V P Y E R I P V S K Q E A L E Y F K K K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
D P Y K V E L I E E L E D G T I T F Y R Q G N F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T D L C R G P H V P S T G Y I K H V K L L N V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G A Y W R G D E R R P Q L T R I Y G I S F P K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
K E L D E Y L H R L E E A R K R D H R R L G R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L E L F T F S Q K V G P G L P L W L P R G A T L
- - - - - - - - - - - - - - - - - - - - - - - L
---------------------------------------------------------------------GCG
289290291292293294295296297298299300301302303304305306307308309310311312
R E T L I N F L R E E Q I R R G Y Q P V V T P H
R E T L I N F L R E E Q I R R G Y Q P V V T P H
ATAGACCTGCCCGAACTCGGCCAGTCGGATCGGCAGCTCCCGGTAGGAGCGGGGCCGGTCGGCGTAGATCAT
313314315316317318319320321322323324325326327328329330331332333334335336
I A R L E L Y K T S G H Y P Y Y K D S Q F P P M
I A - - - - - - - - - - - - - - - - - - - - - -
GATGTG------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
I E N P E T G E G Y L L K P M N C P H H I M I Y
- - - - - - - - - - L L K P M N C P H H I - - -
------------------------------CCCGCTCGTCTTGTAAAGCTCCAGCCGGGCGAT---------
361362363364365366367368369370371372373374375376377378379380381382383384
A D R P R S Y R E L P I R L A E F G Q V Y R Y E
- - - - - - - - - - - I R L A E F G Q V Y R Y -
---------------------------------CTCGCGCAGGAAATTGATCAGCGTCTCGCGCAGCGT---
385386387388389390391392393394395396397398399400401402403404405406407408
Q T G E L S G L T R V R G F T I D D A H I F C R
- - - - - - - - - - - R G F T I D D A H I F - -
---------------------------------CACCTTCTGGCTGAAGGTGAACAGCTCCAGCTC------
409410411412413414415416417418419420421422423424425426427428429430431432
P D Q V K D E F K N V I D L T L Y V F R S L G F
- - - - - - - F K N V I D L T L Y V F R - - - -
---------------------GCGGGCCTCTTCGAGCCGGTGCAGGTATTCGTCGAGTTC------------
433434435436437438439440441442443444445446447448449450451452453454455456
D E F E A Q I S L R D P N N R E K Y V G D D E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
W E Q A E Q A I R E A A A E M G L Q A T E E L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
E A A F Y G P K L D F M V R D A L G R R W Q L G
- - - - - - - K L D F M V - - - - - - - - Q L G
---------------------GCCGTCTTCGAGTTCTTC------------------------GCCCTTCTT
505506507508509510511512513514515516517518519520521522523524525526527528
T V Q L D Y I L P E R F D L Y Y I G A D N Q K H
T V Q L D - - - - - - - - - - - - - - - - - - -
TTTGAAGTACTCCAG---------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R P V M I H R A P F G S L E R F I G V L I E H C
- P V M I H R A P . . S L E R F I G V - - - - -
---CATTTTTTCTTCGATGCGGGCCAG------GGCCGAGAGCTTGCGGCCGCCCAG---------------
553554555556557558559560561562563564565566567568569570571572573574575576
A G N F P L W L A P V Q V A V L P L S D E L N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y A E A V G R R L L E A G F R V E V D T R T E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I G Y K I R Q A E V Q K I P Y M L I V G R R E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E A G T V A V R K H G E G D Q G P A T L D E F I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668
E R L R T E I E A A T R R A T V S E N A
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Archaea/Methanococcus jannaschii/amino acid sequences/Mjannaschii_thr_aa
Archaea/Methanococcus jannaschii/nucleotide sequences/Mjannaschii_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M R D N M K M L L I H S D Y L E F E A K E K T K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I A E E T E N L K G K L D E C L A C F I A V E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
E D E N N P E G T A I G A V E E I E K V A N Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K V N N I V V Y P Y A H L S S D L S S P E T A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K V L K D I E S I L K E R G Y N V L R A P F G W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
Y K A F K I S C K G H P L S E L S R K I V A K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E K K E E G E E S K F Y L L N P E T E E I I E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N E N N I N I I K D E E L L A L A K H E L G I R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
E H K E H D E P P H V K F I K E K D I C S Y E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
A S D P G H F R W Y P K G K L M R D L L A D Y V
- - - - - - - - - - - - - - - M R D L L A D Y V
---------------------------------------------ATGAGAGATTTGTTAGCTGATTATGTT
241242243244245246247248249250251252253254255256257258259260261262263264
Y N L V V N M G A M P V E T P I M Y D L G N P A
Y N L V V N M G A M P V E T P I M Y - - - - - -
TATAACTTAGTTGTCAATATGGGAGCTATGCCAGTAGAAACACCAATTATGTAT------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I R E H A D K F G E R Q Y R F R Q G N K E L M L
- - - - - - - - - - - - - - - - - - - - - - M L
------------------------------------------------------------------ATGCTA
289290291292293294295296297298299300301302303304305306307308309310311312
R F A A C F G Q F M M K K D M Y L L P R Y L P L
R F A A C F G Q F - - - - - - - - - - - - - - L
AGATTTGCAGCATGCTTTGGGCAGTTT------------------------------------------TTA
313314315316317318319320321322323324325326327328329330331332333334335336
K L Y E L S T Y S F R Y E Q R G E L V G L K R L
K L Y E L S T . S F R Y - - - - - - - - - - - -
AAACTCTATGAATTATCAACA---AGCTTTAGATAT------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R C F T M P D M H T V C L N L E Q A M E E F E K
R C F T M P D M H T V - - - - - - - - - - F E K
AGATGCTTTACAATGCCTGATATGCATACTGTC------------------------------TTTGAAAAA
361362363364365366367368369370371372373374375376377378379380381382383384
Q F W E C L K T G D D L N L S Y S V I F R F T K
Q F W E C L K T G D - - - - - - - - - - - - - -
CAGTTCTGGGAATGTTTAAAAACTGGGGAT------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
D F F D E H R D W F F K I A K E Y K N K Y G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
V I L E I L P K R K H Y W V G K V D I A V I D S
- - - - - - - - - - - - - - - K V D I A V - - -
---------------------------------------------AAGGTAGATATTGCTGTA---------
433434435436437438439440441442443444445446447448449450451452453454455456
L G R P I E N P T V Q I D V E S A K R F D I K V
- - - - - E N P T V Q I D - - - - - - - - - - -
---------------GAGAACCCAACCGTGCAAATAGAT---------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
H T N E G E I Y P I I L H C S P T G S I E R V L
- - - - - - - - P I I L H C S P . . S I E R V L
------------------------CCAATAATATTGCACTGCTCACCA------TCAATTGAGAGGGTTTTG
481482483484485486487488489490491492493494495496497498499500501502503504
C G L L E K A A I E A E K G N A P M L P V W L S
C G - - - - - - - - - - - - - - - - - - - - - -
TGTGGT------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P I Q V R V I P V A E R H Y D Y A L K V A E K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
R E N N I R A D F D D R E E S V S K K I R N A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
K E W V P Y V V V I G D E E M E S D K L T V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R E K S T L K K P Y K E K M T L D E L I E R I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
K E T A N Y P Y R P L P L P I R C S L Q P K F H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
Class II
Archaea/Halobacterium sp./amino acid sequences/Halobacterium_thr_aa
Archaea/Halobacterium sp./nucleotide sequences/Halobacterium_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S T V T V T L P D G S T L E L A S G A T V E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V A Y E I G P G L G R D T V A G K V D H E L V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K E T P L T E D C E I E I V T D Q S G D Y L D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L R H T A A H V L A Q A I L R H H P D A K L T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G P Y T E E G F Y Y D V A N V E L D A E D L D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I Q D E A D A I I E A D Y D V E Y V E Y D R E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L E T Y D D N P F K R E I L E T E A A G D D P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
V S F Y R Q D D F E D L C R G P H V E S T G E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
G G F E V L E T S A A Y W R G D E E R E T L T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V Y G T A F P T E S E L D D Y L E R R A E A A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R D H R K I G S E M D L F S I P D V T G P G L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L Y H P N G K T V L R E L S E Y V H G L N R E M
- - - - - - - - V L R E L S E Y V H G L N R E M
------------------------TTCGCCGCGTTGCTCCTTGCGGTACACCTTCCCGTCCTCGAAGTACCG
289290291292293294295296297298299300301302303304305306307308309310311312
G Y D E V E T P H L F R T E L W K Q S G H Y D N
G Y D E V E T P H L F - - - - - - - - - - - - -
CACGGGGAGGTCGCGGTAGCTCCACGAGCCCTC---------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y V D D M F L L D V N D E E Y G L K P M N C P G
- - - - - - - - - - - - - - - G L K P M N C P G
---------------------------------------------GACGTAGTTGTCGTAGTGCCCGGACTG
337338339340341342343344345346347348349350351352353354355356357358359360
H A T I F N E G S W S Y R D L P V R Y F E D G K
H A - - - - - - - - - - - - - - V R Y F E D G K
CTTCCA------------------------------------------GCCCATCTCCCGGTTGAGCCCGTG
361362363364365366367368369370371372373374375376377378379380381382383384
V Y R K E Q R G E L S G L S R V W A F T I D D G
V Y R K - - - - - - - - - - - - W A F T I D D G
GACGTACTCCGA------------------------------------GAGCGGGAGGCCGGGGCCGGTGAC
385386387388389390391392393394395396397398399400401402403404405406407408
H V F A R A D Q I E Q E V R R L I D I I L E V L
H V F - - - - - - - - - V R R L I D I I L E V L
GTCCGGGAT---------------------------CTTCCGGTGGTCGCGCTCGGCGGCCTCCGCGCGGCG
409410411412413414415416417418419420421422423424425426427428429430431432
D T F D L D Y E V A L A T R P E K S V G S D E I
D - - - - - - - - - - - - - - - - - - - - - - -
CTC---------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
W E Q S E S Q L R D V L E E Q G M D Y D V E P G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
D G A F Y G P K I D F A F E D A L G R S W D G P
- - - - - - - K I D F A F - - - - - - - - D G P
---------------------CTCGAAGTCGTCCTGGCG------------------------CGCGGCCTC
481482483484485486487488489490491492493494495496497498499500501502503504
T V Q L D F N M P E R F D L E Y T G S D N D A H
T V Q L D - - - - - - - - - - - - - - - - - - -
GGTCTCCAGAATCTC---------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
Q P V M I H R A L Y G S Y E R F F M V L V E H Y
- P V M I H R A L . . S Y E R F F M V - - - - -
---CTCGACGTCGTAGTCGGCCTCAAT------GTCGGCCTCGTCCTGGATGGCGTC---------------
529530531532533534535536537538539540541542543544545546547548549550551552
D G R F P T W L A P E Q V R I L P V T D D N L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Y A H R V K N E L D G Y R V E V E D R D W T V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R K I Q Q A H D D N V P Y M L V L G D N E E E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G T V S V R D R Q E R E R N D V E L E T F R D H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640
F V G E V D E K R T Q P D F V E
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Chloroflexus aggregans/amino acid sequences/Caggregans_thr_aa
Bacteria/Chloroflexus aggregans/nucleotide sequences/Caggregans_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P V D P K S D P Y Y R L R H S L A H V M A Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
V L E I F P D A K I A I G P P I E N G F Y Y D F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D L P R P L T P E D L T E I E K R M K R I I A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
N H P F I Y R E V T A E E A R Q I F A N Q P Y K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
L E L I E G L A K G L D E Y G E T H H G D T V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S T Y R Q D T F E D L C R G P H L N H T G E I N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
P E A F K L M S I A G A Y W R G D E K N R Q L Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
R I Y G T G W N T K E E L E A Y L H R L E E S R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R R D H R R L G K E L G L F F F S D D I G P G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
P I F S P K G E I I R H E M E K F V R E V Q T R
- - - - - - - - - I R H E M E K F V R E V Q T R
---------------------------GGTAAACTTGTACGTTCCCAGCACCTCGCGGATCACTTGCAGGGC
241242243244245246247248249250251252253254255256257258259260261262263264
Y G Y Q H V W T G N V V K E Q L Y R K S G H Y D
Y G Y Q H V W T G N V V - - - - - - - - - - - -
AAGACTAAACTCCTCTTGAATCTGATCGGGTCGGCA------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
N Y R D S M F P P M V E S E D L I F R L K P M N
- - - - - - - - - - - - - - - - - - R L K P M N
------------------------------------------------------CTCGGCAAAGCGCAGCGG
289290291292293294295296297298299300301302303304305306307308309310311312
C P S H M T L Y N Q L G V I S Y R D L P L R F A
C P S H M - - - - - - - - - - - - - - - L R F A
TAGATCGCGATAACT---------------------------------------------CATCGGCTTGAG
313314315316317318319320321322323324325326327328329330331332333334335336
E F A T L Y R Y E D S G A L S G L T R V R A L T
E F A T L Y R Y - - - - - - - - - - - - R A L T
GCGAAAGATGAGGTCTTCGCTCTC------------------------------------GTAGTGCCCCGA
337338339340341342343344345346347348349350351352353354355356357358359360
Q D D C H I F C R P D Q I Q E E F S L A L Q V I
Q D D C H I F - - - - - - - - - F S L A L Q V I
CTTCCGATAGAGCTGCTCCTT---------------------------ATACCCGTAGCGCGTTTGCACCTC
361362363364365366367368369370371372373374375376377378379380381382383384
R E V L G T Y K F T D Y K V R L S L R G K E G K
R E V L G - - - - - - - - - - - - - - - - - - -
ACGCACAAATTTTTC---------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
Y V Q D D E K W E L A T A A L R A A L E A N G V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
E Y F E A E G E A A F Y G P K A D F L A R D V L
- - - - - - - - - - - - - - K A D F L A - - - -
------------------------------------------GGTACCGTAAATACGCTG------------
433434435436437438439440441442443444445446447448449450451452453454455456
G R E W Q L S T I Q V D F I Q P A R L G C E Y I
- - - - Q L S T I Q V D - - - - - - - - - - - -
------------GCGCCAGTATGCCCCGGCGATGCT------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G E D D K P H T P V V L H R A V T G T T E R F M
- - - - - - - - P V V L H R A V T . . T E R F M
------------------------CAGATCCTCGAACGTATCTTGACGGTA------GATGACAGTGTCGCC
481482483484485486487488489490491492493494495496497498499500501502503504
G I L I E H Y A G A F P L W L A P V Q A V I I P
G I - - - - - - - - - - - - - - - - - - - - - -
GTGATG------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I T D K Q M E Y A R K V R Q R L F A A G L R V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
L D E N R D R M Q G K I R R A Q L Q K I P Y M L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I I G A R E E S A D A V A V R T R A G D D L G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594
M P V E A F L A R A L E E I R T R S
- - - - - - - - - - - - - - - - - -
------------------------------------------------------
Class II
Bacteria/Campylobacter jejuni/amino acid sequences/Cjejuni_thr_aa
Bacteria/Campylobacter jejuni/nucleotide sequences/Cjejuni_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M E K E V I A Y L D N E T I I D S Q S V K N T N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K E I Y F D N S K E S L E V I R H S C A H L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
A Q A I K S L Y P E A K F F V G P V I E D G F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
Y D F R V E S K I G E E D L V K I E K K M K E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A E A K I E I S K Y E I T K S E A L A K F Q N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
D L K Q E V L L R I P D R A V S I Y K Q G E F E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
D L C R G P H V P N T K F L R F F K L T R V A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A Y L G G D E K R E M L T R I Y G T A F A D K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S L K E Y L T I I E E A K K R D H R K L G T E L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
K L F T F D D E I G G G L P I W L S N G A R L R
- - - - - - - - - - - - - - - - - - - - - - L R
------------------------------------------------------------------CTTAGA
241242243244245246247248249250251252253254255256257258259260261262263264
S K L E H M L Y K I H R L R G Y E P V R G P E L
S K L E H M L Y K I H R L R G Y E P V R G P E L
TCTAAACTTGAACATATGCTTTATAAGATCCATCGTTTACGTGGTTATGAGCCTGTGCGTGGGCCTGAACTT
265266267268269270271272273274275276277278279280281282283284285286287288
L K A D A W K I S G H Y A N Y K E N M Y F T Q I
L - - - - - - - - - - - - - - - - - - - - - - -
TTA---------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D E Q E Y G I K P M N C V G H I K I Y Q S D V R
- - - - - G I K P M N C V G H I - - - - - - - -
---------------GGCATTAAGCCTATGAACTGTGTGGGACATATT------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S Y R D L P L K F F E Y G V V H R H E K S G V L
- - - - - - L K F F E Y G V V H R H - - - - - -
------------------TTGAAATTTTTTGAATACGGCGTGGTACATCGTCAT------------------
337338339340341342343344345346347348349350351352353354355356357358359360
H G L F R V R E F T Q D D A H I F C M P S Q I K
- - - - - - R E F T Q D D A H I F - - - - - - -
------------------AGAGAATTCACTCAAGATGATGCACATATTTTT---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E Q V L E I L A F V D N L M K L F D F S Y E M E
- - V L E I L A F V D N L M K - - - - - - - - -
------GTTTTAGAAATTTTAGCTTTTGTGGATAATTTGATGAAA---------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
I S T K P E K A I G D D E I W E I A T K A L K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L D E Q G L K Y G I D E G G G A F Y G P K I D
- - - - - - - - - - - - - - - - - - - - - K I D
---------------------------------------------------------------AAGATTGAT
433434435436437438439440441442443444445446447448449450451452453454455456
I K I T D A L K R K W Q C G T I Q V D F N L P S
I K I - - - - - - - - Q C G T I Q V D - - - - -
ATTAAAATC------------------------CAATGCGGAACCATACAAGTAGAT---------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F K L E Y T D S D N E K K Q P V M L H R A I L
- - - - - - - - - - - - - - - P V M L H R A I .
---------------------------------------------CCTGTAATGTTGCATCGTGCGATT---
481482483484485486487488489490491492493494495496497498499500501502503504
G S F E R F I G I L T E H C A G E F P F F I A P
. S F E R F I G I - - - - - - - - - - - - - - -
---TCTTTTGAAAGATTTATAGGAATT---------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
T A V G I V P I G E A H I A Y A K E I Q K E L L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E L N I D S E V Y E K N E S L S K K I R I A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
Q K L P M I L V L G D D E V A K R S V A L R D R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R A K E Q K N L S L D E F I K L V K E K M S E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602
H F
- -
------
Class II
Bacteria/Synechococcus elongatus/amino acid sequences/Selongatus_thr_aa
Bacteria/Synechococcus elongatus/nucleotide sequences/Selongatus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M V Q S A P S T E A I Q L P K T S E S A Q L K R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
I R H T M S H V M A M A V Q K L F P K A Q V T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
G P W T E T G F Y Y D F D T P E P F T E A D L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A I K K E M V K I I Q Q K L P V V R E E V S R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
E A Q Q R I E A L G E P Y K L E I L Q G L T E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I T L Y H L G D R W W D L C A G P H V E T T A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L N P K A F D L E S V A G A Y W R G D E T K A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L Q R I Y G T A W E T P E Q L T E Y K R R K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A L K R D H R K L G R E L G L F L F A D P V G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G L P L W T P K G T I L R S T L E D F L K Q E Q
- - - - - - - - - - - L R S T L E D F L K Q E Q
---------------------------------GAACTTTTTGAGATTGAGCGCCTTGAAGACAGACAGAAT
241242243244245246247248249250251252253254255256257258259260261262263264
M K R G Y Q S V V T P H L A R V D L F K V S G H
M K R G Y Q S V V T P H L A - - - - - - - - - -
GAGATCGACAACGCTCAAGAACTCAGACGCCAGCTGATCGGG------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W Q N Y R E D M F P M M A E D D E A R G L E Q G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
F V L K P M N C P F H I Q I Y K N E L R S Y R E
- V L K P M N C P F H I - - - - - - - - - - - -
---ACGAATCGGGAGTTCGCGATAGGAGCGCAGTTC------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
L P I R L A E F G T V Y R Y E Q S G E L G G L T
- - I R L A E F G T V Y R Y - - - - - - - - - -
------GAGTACAAAGCCTTGCTCCAGCCCACGGGCTTCATC------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
R V R G F T V D D S H L F V R P D Q L A S E F L
- - R G F T V D D S H L F - - - - - - - - - F L
------GTTTTGCCAGTGCCCTGAAACTTTAAAGAGGTC---------------------------TGATTG
361362363364365366367368369370371372373374375376377378379380381382383384
S V V D L I L S V F K A L N L K K F K A R L S F
S V V D L I L S V F K - - - - - - - - - - - - -
ATAGCCACGCTTCATTTGTTCCTGCTTGAGGAA---------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R D P E S D K Y I G S D D V W E K A E S A I Q A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
A A E T L G M D Y F I G V G E A A F Y G P K L D
- - - - - - - - - - - - - - - - - - - - - K L D
---------------------------------------------------------------GGCGGTGCC
433434435436437438439440441442443444445446447448449450451452453454455456
F I F Q D A L D R E W Q L G T V Q V D Y N L P E
F I F - - - - - - - - Q L G T V Q V D - - - - -
ATAAATCCG------------------------ACCGCGCCAGTAGGCACCTGCCAC---------------
457458459460461462463464465466467468469470471472473474475476477478479480
R F D L E Y V A E D G S R Q R P V M I H R A P F
- - - - - - - - - - - - - - - P V M I H R A P .
---------------------------------------------ACAGAGATCCCACCAGCGATCGCC---
481482483484485486487488489490491492493494495496497498499500501502503504
G S L E R L I G I L I E E Y A G D F P L W L A P
. S L E R L I G I - - - - - - - - - - - - - - -
---ATAGAGCGTGATCGGCTCAGTTAA---------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E Q I R L L P V T E T V L D Y C Q Q V A D Q L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A I G V R V Q V D C S G D R L G K L I R N A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A K I P V M A V I G A Q E A E S E T L S I R T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A T G D L G S L T V A D L T K R L S S A I A E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604
L P H L
- - - -
------------
Class II
Bacteria/Bacteroides fragilis/amino acid sequences/Bfragilis_thr_aa
Bacteria/Bacteroides fragilis/nucleotide sequences/Bfragilis_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M I K I T F P D G S V R E Y N E G V N G L Q I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E S I S S R L A Q D V L A C G V N G E I Y D L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
R P I N E D A S V V L Y K W E D E Q G K H A F W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H T S A H L L A E A L Q E L Y P G I Q F G I G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
A I E N G F Y Y D V D P G E A V I K E A D L P A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E A K M A E L V A K K E A V V R R D I A K G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A L K M F G D R G E T Y K C E L I S E L E D G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I T T Y T Q G D F T D L C R G P H L M T T A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K A I K L T S V A G A Y W R G H E D R K M L T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
I Y G I T F P K K K M L D E Y L A L M E E A K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
R D H R K I G K E M Q L F M F S D T V G K G L P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
M W L P K G T A L R L R L Q D F L R R I Q T R Y
- - - - - - - - L R L R L Q D F L R R I Q T R Y
------------------------TTGCGTTTGCGCTTACAGGACTTCTTGCGCCGTATACAGACTCGTTAT
289290291292293294295296297298299300301302303304305306307308309310311312
D Y Q E V I T P P I G N K L L Y V T S G H Y A K
D Y Q E V I T P P I G - - - - - - - - - - - - -
GACTATCAGGAGGTGATTACTCCGCCTATCGGT---------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y G K D A F Q P I H T P E E G E E Y F L K P M N
- - - - - - - - - - - - - - - - - - F L K P M N
------------------------------------------------------TTCCTGAAGCCGATGAAC
337338339340341342343344345346347348349350351352353354355356357358359360
C P H H C E I Y K N F P R S Y K D L P L R I A E
C P H H C - - - - - - - - - - - - - - L R I A E
TGTCCTCATCATTGT------------------------------------------TTACGTATTGCCGAA
361362363364365366367368369370371372373374375376377378379380381382383384
F G T V C R Y E Q S G E L H G L T R V R S F T Q
F G T V C R Y - - - - - - - - - - - - R S F T Q
TTCGGAACTGTTTGTCGGTAC------------------------------------CGTAGTTTTACTCAG
385386387388389390391392393394395396397398399400401402403404405406407408
D D A H I F C R P D Q V K G E F L R V M D I I S
D D A H I F - - - - - - - - - F L R V M D I I S
GATGATGCACATATTTTC---------------------------TTCCTCCGTGTAATGGACATTATTTCG
409410411412413414415416417418419420421422423424425426427428429430431432
I V F R S M D F D N F E A Q I S L R D K V N R E
I V F R - - - - - - - - - - - - - - - - - - - -
ATTGTGTTCCGT------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K Y I G S D E N W E K A E Q A I I E A C E E K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L K A K I E Y G E A A F Y G P K L D F M V K D A
- - - - - - - - - - - - - - - K L D F M V - - -
---------------------------------------------AAATTGGATTTTATGGTG---------
481482483484485486487488489490491492493494495496497498499500501502503504
I G R R W Q L G T I Q V D Y N L P E R F E L E Y
- - - - - Q L G T I Q V D - - - - - - - - - - -
---------------CAGTTAGGTACTATCCAGGTTGAC---------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
M G S D N Q K H R P V M I H R A P F G S M E R F
- - - - - - - - - P V M I H R A P . . S M E R F
---------------------------CCGGTAATGATTCACCGTGCTCCG------TCTATGGAACGCTTT
529530531532533534535536537538539540541542543544545546547548549550551552
V A V L I E H T A G K F P L W L T P E Q V V I L
V A V - - - - - - - - - - - - - - - - - - - - -
GTCGCTGTA---------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P I S E K F N E Y A E K V K T Y L K M K E I R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
I V D D R N E K I G R K I R D N E M K R I P Y M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
L I V G E K E A E N G E V S V R R Q G E G D K G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646
T M K F E E F G E I L N E E V Q N M I N K W
- - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------
Class II
Bacteria/Thermus thermophilus/amino acid sequences/Tthermophilus_thr_aa
Bacteria/Thermus thermophilus/nucleotide sequences/Tthermophilus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M T V Y L P D G K P L E L P E G A T A K D V A R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A L G E G W E R R A V G A I V D G E L Y D L L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L P Q G A K V R L L T E K D P E F Q T L F R H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T L A H V L A Q A V K E F F R E K G Y D P E S V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R L G V G P V I E K G F Y Y D I E A P E P L S D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E D L P A I E A K M R E I L K R D L P L R R F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L S R E E A L A R Y R G K D P Y K T E L V L E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P E G E E I S F Y Q Q G D E A Y G F T D L C R G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
P H V P S T G R I P P H F K L T H V A G A Y W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G D E N R P M L Q R V Y G V A F R T A E E L K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Y L W Q L E E A K K R D H R R L G R E L E L F L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I D P L V G K G L V L W L P K G N V V R E E L M
- - - - - - - - - - - - - - - - - - V R E E L M
------------------------------------------------------GTCCGGGAGGAGCTCATG
289290291292293294295296297298299300301302303304305306307308309310311312
A F M R E E Q V R R G Y Q L V T T P H I G S L E
A F M R E E Q V R R G Y Q L V T T P H I G - - -
GCCTTCATGCGGGAGGAGCAGGTGAGGCGGGGCTACCAGCTCGTGACCACGCCCCACATCGGG---------
313314315316317318319320321322323324325326327328329330331332333334335336
L Y K T S G H Y P Y Y A E S Q F P P I S F K E R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G E E E E Y L L K P M N C P H H I R I Y A Y R K
- - - - - - L L K P M N C P H H I - - - - - - -
------------------CTCCTCAAGCCCATGAACTGCCCCCACCACATC---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
R S Y R E L P L R L A E F G T V Y R Y E K A G E
- - - - - - - L R L A E F G T V Y R Y - - - - -
---------------------CTAAGGCTTGCCGAGTTCGGCACCGTCTACCGCTAC---------------
385386387388389390391392393394395396397398399400401402403404405406407408
L L G L T R V R G F T Q D D A H I F C T P E E V
- - - - - - - R G F T Q D D A H I F - - - - - -
---------------------AGGGGCTTCACCCAGGACGACGCCCACATCTTC------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K G E F L G V L D L V L K V F A T L G L K D Y R
- - - F L G V L D L V L K V F A - - - - - - - -
---------TTCCTCGGGGTCTTGGACCTGGTGCTTAAGGTCTTCGCC------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
A R I G V R D P K S D K Y V G D E A K W A L A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
R Q I E E A A A E A G L R Y T V E E G D A A F Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
G P K L D F V V K D A L G R E W Q L G T I Q V D
- - K L D F V V - - - - - - - - Q L G T I Q V D
------AAGCTGGACTTCGTGGTG------------------------CAGCTCGGCACCATCCAGGTGGAC
505506507508509510511512513514515516517518519520521522523524525526527528
Y N L P E R F G L T Y V G K D G E E H R P V M L
- - - - - - - - - - - - - - - - - - - - P V M L
------------------------------------------------------------CCCGTGATGCTC
529530531532533534535536537538539540541542543544545546547548549550551552
H R A P F G S L E R F I G I L I E H F A G D F P
H R A P . . S L E R F I G I - - - - - - - - - -
CACCGGGCCCCC------TCCCTGGAGCGCTTCATCGGCATC------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
L W L A P V Q A V V V P V S E K Q E D Y A R E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
A G R L K E A G L R A E A D T R P E R M Q A R I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
R D A E V Q K V P Y I L V V G E R E K A E G A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
S V R R R K K G N L G T M P L A A F L E G A L R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659
E Y R E R R L E P V F
- - - - - - - - - - -
---------------------------------
Class II
Bacteria/Herpetosiphon aurantiacus/amino acid sequences/Haurantiacus_thr_aa
Bacteria/Herpetosiphon aurantiacus/nucleotide sequences/Haurantiacus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P P V N P D N D P L Y R L R H S T A H V L A Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A V L E I F P E G K I A I G P P V E N G F Y Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F D L P R P L T P D D L K D I E A K M R K I I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
A K H R F A Y R E V S A D E A R E L F K N Q P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K L E L I A G L A K G E D E Y G E K A A A S D T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I I S T Y K H D S F E D L C K G P H V E S L G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
I P P N G F K L L R V S G A Y W R G D E K R P M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
L Q R I Y G T V W P S K E E L D H Y L W Q Q E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
A K K R D H R K L G R E L G L F T F S Q K V G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G L A L W L P K G A I L R D V L E R F L R Q A Q
- - - - - - - - - - - L R D V L E R F L R Q A Q
---------------------------------CAAGCCCATCGTGCCAAACACGAAGAGAATCAAGTCAAC
241242243244245246247248249250251252253254255256257258259260261262263264
I E R G Y L P V V T P H M G K I D L Y K T S G H
I E R G Y L P V V T P H M G - - - - - - - - - -
GACTTTCAAAAATTCTGCTTCGAGCTGATCGGGCGTGACGAA------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
W Y T Y R D G I F P P M R E I E N D D T E N P E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
G E I Y L L K P M N C P H H I E I Y A S E P R S
- - - - L L K P M N C P H H I - - - - - - - - -
------------ATACGAACGTGGTTCGCTAGCATAAATTTCAAT---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
Y R D L P L R L A E F G T V Y R Y E H S G E L T
- - - - - L R L A E F G T V Y R Y - - - - - - -
---------------CTCTGGATTTTCCGTGTCATCATTTTCAATTTCGCG---------------------
337338339340341342343344345346347348349350351352353354355356357358359360
G L L R V R S F T V D D S H L F V T P D Q L E A
- - - - - R S F T V D D S H L F - - - - - - - -
---------------GTGCCCGCTCGTTTTGTAAAGATCGATCTTGCC------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E F L K V V D L I L F V F G T M G L K D F Q A R
- F L K V V D L I L F V F G - - - - - - - - - -
---GCCGCGTTCGATTTGAGCTTGGCGCAAAAATCGCTCCAA------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
V G L R E V G N P K Y I G S D E V W E K A Q N A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
I I N A A E K K G L N Y I V V E G E A A F Y G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K L D F I F R D V L G R Q W Q L G T V Q V D Y N
K L D F I F - - - - - - - - Q L G T V Q V D - -
ATAAATCCGTTGCAACAT------------------------GTATGCGCCCGAAACTCGCAGCAA------
457458459460461462463464465466467468469470471472473474475476477478479480
L P E R F E I E Y T G E D G Q K H R P I M I H R
- - - - - - - - - - - - - - - - - - P I M I H R
------------------------------------------------------TTCAAACGAATCGTGTTT
481482483484485486487488489490491492493494495496497498499500501502503504
A P F G S I E R F V G T L I E Q Y A G A F P V W
A P . . S I E R F V G T - - - - - - - - - - - -
GTAGGT------GATCGTATCGCTGGCAGCGGCTTT------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
L A P V Q V T L V P I T D R H V A Y A E S V A A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
K L N A Q G L R V E V D A S N N R M N A K I R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
A Q K L K I P Y M L V V G D K E E E A G A V A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
R Q R S G G D L G S I S V D E F I A R I K D E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604
A N Y Q
- - - -
------------
Class II
Bacteria/Thermotoga maritima/amino acid sequences/Tmaritima_thr_aa
Bacteria/Thermotoga maritima/nucleotide sequences/Tmaritima_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M K I K V K L P D G K E K E Y D R G I T P A E I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A K E L G I K K A I G A V V N G E L W D L K R P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I E N D C E L R L V T L E D P E A P E F Y R H T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
M A H I L A Q A V M R L Y G K E N V K L G I G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
T I E N G F Y Y D F D I K N G R L T E E D L P K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
I E Q E M K K I I K E N L P I E R K E I S K E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
A R E L F R D Q P Y K L E L I E E I E G N R V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
I Y R Q G E F V D L C R G P H L P S T G I V K H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
F K L L S V S G A Y W R G S E K N P M L T R V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G T A F A K K E D L D N Y L K F L E E A Q R R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
H R K L G P Q L E L F M L N T E Y A P G M P F F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
L P K G V V V L N E L M K F S R E L H R E R G Y
- - - - - - V L N E L M K F S R E L H R E R G Y
------------------GAGACCGTGGAGAACTCCGCTTCTCTCGTATCTGTGAACCCGGCCAAACTCGAA
289290291292293294295296297298299300301302303304305306307308309310311312
Q E I F T P L I M N E Q L W K I S G H W D H Y A
Q E I F T P L I M - - - - - - - - - - - - - - -
GAATCTCAGCGGTAGGTCCCTGTAGGA---------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
E N M Y F I E K D E E R Y A V K P M N C P G H I
- - - - - - - - - - - - - A V K P M N C P G H I
---------------------------------------GTACATGTTCTCAGCGTAGTGATCCCAGTGACC
337338339340341342343344345346347348349350351352353354355356357358359360
L V Y K S R T V S Y R D L P L R F F E F G R V H
- - - - - - - - - - - - - - L R F F E F G R V H
------------------------------------------GATCTCCTGGTATCCTCTCTCACGATGGAG
361362363364365366367368369370371372373374375376377378379380381382383384
R Y E R S G V L H G L M R V R S F T Q D D A H I
R Y - - - - - - - - - - - - R S F T Q D D A H I
TTCTCT------------------------------------CTTTGGAAGGAAGAACGGCATACCGGGAGC
385386387388389390391392393394395396397398399400401402403404405406407408
F C T P D Q I E E E I L G V L D L I N T I Y S Q
F - - - - - - - - - I L G V L D L I N T I Y S -
GTA---------------------------TTGAGGTCCCAATTTTCTGTGGTCCCTTCGCTGGGCTTC---
409410411412413414415416417418419420421422423424425426427428429430431432
F G F T Y R V E L S T M P E D H M G D E A I W E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
K A T T A L K N A L E R A G L S Y K V N E G E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
A F Y G P K I D F H I R D S I G R E W Q C A T I
- - - - - K I D F H I - - - - - - - - Q C A T I
---------------TCTGCAGAGATCCACGAA------------------------TCTGTTGCCTTCGAT
481482483484485486487488489490491492493494495496497498499500501502503504
Q L D F M M P E K F N V T Y I G P D N K E H R A
Q L D - - - - - - - - - - - - - - - - - - - - A
CTCCTCTAT------------------------------------------------------------CTT
505506507508509510511512513514515516517518519520521522523524525526527528
V M I H R A I Y G S L E R F F G I L I E H F A G
V M I H R A I . . S L E R F F G I - - - - - - -
TCTTTCTATAGGAAGATTTTC------TATCTTCTTCATCTCCTGTTCTAT---------------------
529530531532533534535536537538539540541542543544545546547548549550551552
A F P T W L A P I Q V A V I P I S E K H N D G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
E K V A R R I S Q E G F R V F F D N R R E T L G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
Y R I R Q A Q T Q K I P Y M I I I G D K E L E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
G K I S V R T R T G K E I K D V D P E H F V E T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640
L R N E V L S R K L E L S M E G
- - - - - - - - - - - - - - - -
------------------------------------------------
Class II
Bacteria/Bacillus licheniformis/amino acid sequences/Blicheniformis_thr_aa
Bacteria/Bacillus licheniformis/nucleotide sequences/Blicheniformis_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S E S L I K V Q F K E G N T K E F P K G I T I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
K R I A E S I S T T L R K H A V V A K V D E K F
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
V D L S Y T L D K D V K L D I F T L D S K E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S V L R H T S T H I L A H A V K R L Y S S V S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G I G P V I E D E F F Y D L K L E H S L S P E D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L L A I E R E M E K I I K E N I E I K R I V V S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
Y E E A E K L F E E N N E P L K L E I L R G I P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K G Q E I T L Y Q Q G E F I D L C R G P H L P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T G F I K A F K L T R V S G A Y W R G N R Q K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V L Q R V Y G V A F K K K D D L N E Y L Y F L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
Q A A K H D H R Q L G K Q L D L F M F S E E A P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G M P F Y L P K G Q I V R K E L E K L S R E L Q
- - - - - - - - - - - V R K E L E K L S R E L Q
---------------------------------GTTAGAAAAGAATTGGAGAAATTATCCCGTGAACTTCAA
289290291292293294295296297298299300301302303304305306307308309310311312
N N A S Y D E V H T P F M M N Y R L W E K S G H
N N A S Y D E V H T P F M M - - - - - - - - - -
AATAATGCATCGTACGATGAGGTCCATACACCGTTTATGATG------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
W D H Y Q E N M Y F S E V D N T K F A I K P M N
- - - - - - - - - - - - - - - - - - A I K P M N
------------------------------------------------------GCAATCAAACCAATGAAT
337338339340341342343344345346347348349350351352353354355356357358359360
C P G H M L I F K N N L Y S Y R D L P I R L A E
C P G H M - - - - - - - - - - - - - - I R L A E
TGTCCTGGACATATG------------------------------------------ATTCGATTGGCGGAA
361362363364365366367368369370371372373374375376377378379380381382383384
Y G Q V H R H E F S G S L N G L L R V R T F C Q
Y G Q V H R H - - - - - - - - - - - - R T F C Q
TATGGACAAGTTCATCGACAT------------------------------------CGCACATTTTGTCAG
385386387388389390391392393394395396397398399400401402403404405406407408
D D A H I F V R E D Q I E S E I K K V F H L I D
D D A H I F - - - - - - - - - I K K V F H L I D
GATGACGCTCACATCTTT---------------------------ATTAAGAAGGTATTTCATTTAATTGAC
409410411412413414415416417418419420421422423424425426427428429430431432
Q V Y R T I G F E Y S V E L S T R P D D S L G N
Q V Y R - - - - - - - - - - - - - - - - - - - -
CAAGTGTATCGT------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N H L W E V S E G S L K N V L D D L A I K Y Q V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
N E G D G A F Y G P K I D F H I K D A L K R S H
- - - - - - - - - - K I D F H I - - - - - - - -
------------------------------AAAATTGATTTCCATATT------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q C G T I Q L D F Q M P E K F D L T Y I N H N N
Q C G T I Q L D - - - - - - - - - - - - - - - -
CAGTGCGGAACAATCCAACTTGAT------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
E K V R P V V I H R A I F G S I D R F F G I L I
- - - - P V V I H R A I . . S I D R F F G I - -
------------CCTGTTGTTATCCACCGTGCTATT------TCTATTGATCGTTTTTTTGGAATT------
529530531532533534535536537538539540541542543544545546547548549550551552
E H F A G V F P V W L A P I Q V Q I I P I S H I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
H L E Y C L G I K S E L K Q H G I R V Q I N E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
N Q K L G Y K I R E A Q V Q K I P Y T L V V G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
N E I K E N G V N V R K Y G E E Q Q K N V S I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639
S F K K N I L Q Q I K T R S V
- - - - - - - - - - - - - - -
---------------------------------------------
Class II
Bacteria/Borrelia burgdorferi/amino acid sequences/Bburgdorferi_thr_aa
Bacteria/Borrelia burgdorferi/nucleotide sequences/Bburgdorferi_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S K D L D K E D I L Y K K R H S I A H V M A E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A V L D L F P N T K I A I G P P I K D G F Y Y D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
F E F K K Q I T E D S L L D I E N R M R E I L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
T G S S F E K E I I S V E Q A L E I F K D E P Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
K I D L I K N F D L Q N E V S I Y K S H N F V D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
L C R G P H V E N M N K I D P K A F K L T S I A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
G A Y W R G S E K N P M L T R I Y G T L W N N E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
K E L R S Y L N L R E E I K K R D H R K L G K E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
L D L F S I H E E I G P G L V F F H P N G A K I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------ATA
217218219220221222223224225226227228229230231232233234235236237238239240
R A L I E D F W R E E H S K N G Y D I L F T P H
R A L I E D F W R E E H S K N G Y D I L F T P H
AGAGCTTTAATAGAAGATTTTTGGAGAGAAGAGCACTCCAAAAATGGGTATGATATTCTTTTTACTCCTCAT
241242243244245246247248249250251252253254255256257258259260261262263264
I G K S W L W Q T S G H L D F Y K D S M F E K I
I G - - - - - - - - - - - - - - - - - - - - - -
ATTGGC------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
E M D K S D Y Y L K P M N C P F H I A I Y N T G
- - - - - - - Y L K P M N C P F H I - - - - - -
---------------------TATCTTAAACCCATGAATTGTCCTTTTCATATT------------------
289290291292293294295296297298299300301302303304305306307308309310311312
K H S Y R D L P F R W A E L G T V Y R Y E K I G
- - - - - - - - F R W A E L G T V Y R Y - - - -
------------------------TTTAGATGGGCCGAGCTTGGCACTGTGTATCGTTAT------------
313314315316317318319320321322323324325326327328329330331332333334335336
A L H G M M R A R G F T Q D D A H I I C T H S Q
- - - - - - - - R G F T Q D D A H I I - - - - -
------------------------AGAGGGTTTACTCAGGATGATGCTCATATTATA---------------
337338339340341342343344345346347348349350351352353354355356357358359360
V L D E I K E V L R F A I Y M W S K F G F S N L
- - - - I K E V L R F A I Y M W S - - - - - - -
------------ATTAAAGAAGTTCTTAGGTTTGCTATTTATATGTGGAGT---------------------
361362363364365366367368369370371372373374375376377378379380381382383384
K A Y L S T K P D K S V G N D S D W E M S L K V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
L E E T L S D F E V P Y E I D K G G G A F Y G P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
K I D L K I V D S L E R E W Q M S T I Q F D F N
K I D L K I - - - - - - - - Q M S T I Q F D - -
AAAATTGATCTTAAGATA------------------------CAGATGAGTACAATTCAATTTGAT------
433434435436437438439440441442443444445446447448449450451452453454455456
L P E R F N M T Y T A E D G K E K R P F M I H R
- - - - - - - - - - - - - - - - - - P F M I H R
------------------------------------------------------CCATTTATGATTCATAGA
457458459460461462463464465466467468469470471472473474475476477478479480
A L L G S I E R F F G I L V E H Y G G A F P L W
A L . . S I E R F F G I - - - - - - - - - - - -
GCTTTG------TCTATTGAAAGATTTTTTGGAATT------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
L S P V Q V V I I P V N N I V E D Y A I K V F N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
K F K N E G I R I K L D N S S S R M N A K I R E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
Y Q A K K I P Y M F I I G E R E A I E E R I S I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R T R T N E Q I N G M K L D E A L K F I L F K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581
R D K E I
- - - - -
---------------
Class II
Bacteria/Candidatus Amoebophilus asiaticus/amino acid sequences/CAmoebophilusAsiaticus_thr_aa
Bacteria/Candidatus Amoebophilus asiaticus/nucleotide sequences/CAmoebophilusAsiaticus_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H N H T V N I A L P D G T I K S F A K G V T S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L E I A Q S I S E R L S Q Q I L A S L V N G E V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
W D I T R P I T E D A A V K L L T W Q D E D G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
K A F W H S S A H L M A E A L E S L Y P G I K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
G I G P A I A N G F Y Y D I D F G D Y D F D A T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
H L P R I E E K M L E L A R Q N N L Y Q G I V V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N K P A A I S F F Q K K G D P Y K V E L L E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
Q D G S I T F Y K H G N F T D L C R G P H I P H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
T G F I K A V K L L N I S G A Y W R G N E K N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
Q L T R I Y G I T F P Q Q K E L K A Y L E L L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
E A Q K R N H Q K I G K E L K L F T F S E K V G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
I G L P L W L P R G T V L R E Q L E Q F L R R A
- - - - - - - - - - - - L R E Q L E Q F L R R A
------------------------------------TTGCGCGAGCAGCTAGAACAGTTTTTACGTCGGGCC
289290291292293294295296297298299300301302303304305306307308309310311312
Q V K A G Y Q P V V T P H I G H K E L Y M T S G
Q V K A G Y Q P V V T P H I G - - - - - - - - -
CAGGTAAAAGCAGGCTACCAACCAGTAGTTACCCCTCACATAGGT---------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
H Y D K Y G E D S F Q P I R T P H E G E E F F L
- - - - - - - - - - - - - - - - - - - - - - F L
------------------------------------------------------------------TTCTTG
337338339340341342343344345346347348349350351352353354355356357358359360
K P M N C P H H C E I Y K H E P R S Y R D L P V
K P M N C P H H C - - - - - - - - - - - - - - V
AAACCTATGAATTGCCCCCACCATTGT------------------------------------------GTG
361362363364365366367368369370371372373374375376377378379380381382383384
R L A E F G T V Y R Y E Q H G E L H G L V R T R
R L A E F G T V Y R Y - - - - - - - - - - - - R
CGCTTGGCAGAATTTGGTACTGTGTATCGATAT------------------------------------AGG
385386387388389390391392393394395396397398399400401402403404405406407408
G F T Q D D A H I F C R N D Q V R E E F A K V I
G F T Q D D A H I F - - - - - - - - - F A K V I
GGCTTTACACAAGATGATGCGCACATATTT---------------------------TTTGCTAAAGTTATA
409410411412413414415416417418419420421422423424425426427428429430431432
D L V T Y V F S A L G F S D Y T A R L S F R D P
D L V T Y V F S - - - - - - - - - - - - - - - -
GACTTGGTAACTTATGTGTTTAGT------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E Q L H K Y I G D Q E D W D K A E E A I E E V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
K L R K L N T T K A L G E A A F Y G P K L D F M
- - - - - - - - - - - - - - - - - - - K L D F M
---------------------------------------------------------AAGTTAGATTTTATG
481482483484485486487488489490491492493494495496497498499500501502503504
V K D A L G R N W Q L G T V Q L D Y Q L P V R F
V - - - - - - - - Q L G T V Q L D - - - - - - -
GTG------------------------CAGCTTGGCACAGTACAGCTAGAT---------------------
505506507508509510511512513514515516517518519520521522523524525526527528
D L S Y T G A D N K K H R P V M I H R A P F G S
- - - - - - - - - - - - - P V M I H R A P . . S
---------------------------------------CCTGTAATGATTCATAGAGCACCC------TCA
529530531532533534535536537538539540541542543544545546547548549550551552
L E R F I A I L L E H T A G K L P L W L A P E Q
L E R F I A I - - - - - - - - - - - - - - - - -
TTAGAGCGATTTATTGCTATA---------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V A I L P I S E K F A A Y A E E V N Q N L R N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
D I R C F I D H R D E K I G K K I R E A E L S K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I P Y M F I I G E K E Q L E R T V S V R K Q G A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644
G D Q G S F P I D K L V Q E I V E D I S
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Bacteria/Deinococcus radiodurans/amino acid sequences/Dradiodurans_thr_aa
Bacteria/Deinococcus radiodurans/nucleotide sequences/Dradiodurans_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M H V T L P D G K Q L D L Q P G A T A L D A A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
A I G P R L A Q D A L G A T A N G E L T D L M T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
P L S D G A S I T L I T K K N P G D A A P L F R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
H S L G H V M S Q A V G E Y Y K A K G Y G P D A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
I K R G V G P Y I E N G W Y Q D F D L P E P L K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E E D L P E I E K I M R D I I G R G L D I T R R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E I S K D E A L A Q F P H D P Y K A E L I E G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P D D E P I T F Y S Q G D Y T D L C R G P H F P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S T G K L P Q S F K L M S T S G A Y W R G N E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
N P I L Q R I Y G V A F A T Q K E L D E Y L F Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
L E E A K R R D H R K L G K E L E L F T I D P L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
V G K G L P L W L P N G T V L R E E L T N F M K
- - - - - - - - - - - - - - L R E E L T N F M K
------------------------------------------CTCGTAGCGGTACACCGTGCCGAACTCGGC
289290291292293294295296297298299300301302303304305306307308309310311312
E Q Q F Q R G Y Q G V V T P N I G N L D L Y R T
E Q Q F Q R G Y Q G V V T P N I G - - - - - - -
CAGCCGCACCGGCAGGTCGCGGTAGCTGCGCGGCTTGCTGGCGTAAATTCG---------------------
313314315316317318319320321322323324325326327328329330331332333334335336
S G H Y P Y Y S E S Q F N P I Q V D E E E Y M L
- - - - - - - - - - - - - - - - - - - - - - M L
------------------------------------------------------------------GTAGTG
337338339340341342343344345346347348349350351352353354355356357358359360
K P M N C P H H V R I Y A S K P R S Y R D L P V
K P M N C P H H V - - - - - - - - - - - - - - V
CCCGGAGGTGCGGTACAGGTCGAGGTT------------------------------------------CTG
361362363364365366367368369370371372373374375376377378379380381382383384
R L A E F G T V Y R Y E Q S G E L N G L T R V R
R L A E F G T V Y R Y - - - - - - - - - - - - R
CTGCTCTTTCATGAAGTTGGTCAGCTCTTCGCG------------------------------------CTT
385386387388389390391392393394395396397398399400401402403404405406407408
G F T Q D D A H I F C R P D Q L K R E F L D V L
G F T Q D D A H I F - - - - - - - - - F L D V L
GCCCACCAGCGGGTCGATGGTGAACAGTTC---------------------------GCGCCGCTTGGCTTC
409410411412413414415416417418419420421422423424425426427428429430431432
D L T V L V L K T F G M T D V R F R V G V R D P
D L T V L V L K - - - - - - - - - - - - - - - -
TTCGAGCTGAAACAGGTACTCGTC------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
E S D K Y V G D E Q N W A L A E R Q I I E A V E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E V G L P Y T I E P G D A A F Y G P K L D F V V
- - - - - - - - - - - - - - - - - - K L D F V V
------------------------------------------------------GAAGGTGATGGGTTCGTC
481482483484485486487488489490491492493494495496497498499500501502503504
K D V L G R E W Q L G T I Q V D Y N L P E R F D
- - - - - - - - Q L G T I Q V D - - - - - - - -
------------------------AGCCTTGTAGGGGTCGTGGGGAAA------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
I S Y T G E D G Q E H R P I M I H R A P F G S I
- - - - - - - - - - - - P I M I H R A P . . S I
------------------------------------GATGTCGCGCATGATCTTTTCGAT------CAGGTC
529530531532533534535536537538539540541542543544545546547548549550551552
E R F T G I L I E H Y A G D F P L W L A P R Q V
E R F T G I - - - - - - - - - - - - - - - - - -
CTCTTCTTTCAGCGGCTC------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
M I I P I A D R H N A Y A E E L R E E L H R A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
L R A E V D D S S N R M Q A K V R D A E L H K I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
P V M L I V G D K E Q E A R E V S V R E R T G E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
G T K E R K G V K F D E L K A E L L E R R K N R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649
S
-
---
Class II
Eukaryotes/Giardia lamblia/amino acid sequences/Glamblia_thr_aa
Eukaryotes/Giardia lamblia/nucleotide sequences/Glamblia_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M P D F V T E R L A K F N A L R E R H A A S Q P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
T G G P F T V T L P D G K T T E I P A S F T A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
D V A K Q V V K N K K V Y S K F L A A V R D D E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
V I D M S A R L G K T C K L E F L T F D D P R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R E V F W H S S A H L L G Y A L E K T F Q A H L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
G H G P A I D S G F F Y D A F F E N S L K M E P
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E S L L Q L D K A A A E I V K Q A A A A P G D S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
P V R R F T R L E V T K Q E A L D L F S Y S K L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K S E L I S D H V Q D G E M C S V Y Q C G D F V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
D F C R G P H I P D L G L I Q A F K C M Y S S A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
A Y F K G D Q N R E S M Q R V Y A V A F P S K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
Q L D K H I E L L E E A K R R D H R N L A K E M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D L F M T H K Y A P G A P M F M N N G T R I Y R
- - - - - - - - - - - - - - - - - - - - - I Y R
---------------------------------------------------------------ATCTACCGC
313314315316317318319320321322323324325326327328329330331332333334335336
K L E A F I R E L L H E F D Y E E V M T P T F L
K L E A F I R E L L H E F D Y E E V M T P T F L
AAGCTCGAAGCTTTTATTCGCGAGCTCCTCCATGAGTTTGATTATGAAGAGGTCATGACACCGACGTTTCTC
337338339340341342343344345346347348349350351352353354355356357358359360
N T D L W G I S G H L Q H Y K E N M F L L E R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
E K T D P Q Y G L K P M N C P C H C L L Y K N Q
- - - - - - - G L K P M N C P C H C - - - - - -
---------------------GGTCTGAAACCCATGAACTGTCCGTGTCACTGT------------------
385386387388389390391392393394395396397398399400401402403404405406407408
H H S V Q E L P I R M A E F G V V H R N E L S G
- - - - - - - - I R M A E F G V V H R N - - - -
------------------------ATACGGATGGCAGAGTTTGGAGTTGTGCACCGCAAT------------
409410411412413414415416417418419420421422423424425426427428429430431432
A L S G L T R V V R F E Q D D A H I F C T V D Q
- - - - - - - - V R F E Q D D A H I F - - - - -
------------------------GTGCGTTTTGAGCAAGATGATGCACACATTTTC---------------
433434435436437438439440441442443444445446447448449450451452453454455456
I E Q E M T G L I E F I K R V Y T P F G I D F A
- - - - M T G L I E F I K R V Y T - - - - - - -
------------ATGACTGGCTTGATCGAATTTATCAAACGCGTTTATACA---------------------
457458459460461462463464465466467468469470471472473474475476477478479480
L S L S L R P E K K M G S D E L W D R A E G T L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
R K V L T N T G L D F K E N P G D G A F Y G P K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAG
505506507508509510511512513514515516517518519520521522523524525526527528
I D V H L T D A L G R Q H Q C G T I Q L D F N L
I D V H L - - - - - - - - Q C G T I Q L D - - -
ATTGATGTCCATCTA------------------------CAGTGCGGTACCATTCAGCTTGAC---------
529530531532533534535536537538539540541542543544545546547548549550551552
P S K D R F D L L Y S V Y D E K T G S V K Q E H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
P V M I H R A I L G S V E R F M A I L I E N T G
P V M I H R A I . . S V E R F M A I - - - - - -
CCAGTGATGATTCATAGGGCTATC------TCCGTTGAGCGCTTCATGGCCATC------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G R F P F W I S P R Q I V V I P L H G E D I V A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
Y A K T V R E R Y H S K G Y F V D L D I S S E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
M E K K I A V A W N K K Y N F I M V V G A Q E K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
G T C S V A L S G R T L S A Y I G E K D N Q R A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695
R K V L T L E E T D A L L A E L S S G R A N M
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Eukaryotes/Dictyostelium discoideum/amino acid sequences/Ddiscoideum_thr_aa
Eukaryotes/Dictyostelium discoideum/nucleotide sequences/Ddiscoideum_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S F L K L T K S I Q K I N N F N N N K I N L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
N K Y F S T T N I N N S G G G G N I K L N D G R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
I F K F E D K Q T P L T I A N K I N K T I G K Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
S I L S R L N G N K L I S M K E I I E M S G K D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
Y N I E F L N F E E H S D A R I C F W N S S S L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
V L A R A T M E Y F K N E N K E I E L I N F G H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
L V N P Q T A D N I N Q G T F Y I D I F F K D K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
N Q T I K D N D I N K I K K I M E Y I V K R N D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K F E I L K N D Q Q D Q D Q D Q E E S F I K F G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
E F K F K N N F L T I D S S N S I V S L D L I K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
N S S V V G P N K E Y S E L Q R I V G I S F P S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
K D Q M N N W V E I Q K I A A L R D H R V I G K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
D Q E L F F F H P F S P G S C F F L P H G T K I
- - - - - - - - - - - - - - - - - - - - - - - I
---------------------------------------------------------------------TTT
313314315316317318319320321322323324325326327328329330331332333334335336
Y N K L L Q F L R L E Y R K R G Y Q E V I S P N
Y N K L L Q F L R L E Y R K R G Y Q E V I S P N
ATAACTACGTGCTCTATGAGCATACATTAAACAATGGCCCGGACAATTCATTGGTTTTAAAGAGTATTGAGT
337338339340341342343344345346347348349350351352353354355356357358359360
I Y N Q K L W E T S G H W D N Y K D N M F S F E
I Y - - - - - - - - - - - - - - - - - - - - - -
ATGATC------------------------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
C D H T Q Y S L K P M N C P G H C L M Y A H R A
- - - - - - S L K P M N C P G H C - - - - - - -
------------------TATAACTTCTTGATAACCACGTTTACGATATTC---------------------
385386387388389390391392393394395396397398399400401402403404405406407408
R S Y K E L P M R I A D F G V L H R N E T H G S
- - - - - - - M R I A D F G V L H R N - - - - -
---------------------ATGTGGTAAAAAGAAACAACTACCAGGACTAAATGG---------------
409410411412413414415416417418419420421422423424425426427428429430431432
L S G L T R V R R F Q Q D D A H I F C T P D M I
- - - - - - - R R F Q Q D D A H I F - - - - - -
---------------------TCTATGATCACGTAATGCTGCAATCTTTTGAAT------------------
433434435436437438439440441442443444445446447448449450451452453454455456
R E E I K Q C L D F M K Y V Y T I F N F T F H L
- - - I K Q C L D F M K Y V Y T - - - - - - - -
---------ACTTGGGAATGAAATACCAACAATACGTTGAAGTTCTGA------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
E L S T R P D S Y L G E L S V W E K A E T S L S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Q V L T E F C G D K W T I N H G D G A F Y G P K
- - - - - - - - - - - - - - - - - - - - - - - K
---------------------------------------------------------------------AAT
505506507508509510511512513514515516517518519520521522523524525526527528
I D I H L K D A N G K N H Q C A T I Q L D F Q L
I D I H L - - - - - - - - Q C A T I Q L D - - -
TTCAAATTTATCATT------------------------TTTTTTAATTTTATTTATATCATT---------
529530531532533534535536537538539540541542543544545546547548549550551552
P I R F N L E Y S G G L N N N N N N N N N N E E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
I N D N N N N N S L N R P V M I H R A L F G S V
- - - - - - - - - - - - P V M I H R A L . . S V
------------------------------------TTTATTTTCATTTTTAAAATATTC------TGCACG
577578579580581582583584585586587588589590591592593594595596597598599600
E R M M A I L M E H T A G K W P F W L S P R Q C
E R M M A I - - - - - - - - - - - - - - - - - -
TGCCAATACTAATGAACT------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
I V I P V S N K F N Q F A Q E I Q S K I N L A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
Y D V D V D L N D S K L L S K K I R E A T V S Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
Y N Y I I V V G Q E E I D T N I L N V R K R D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
673674675676677678679680681682683684685686687688689690691692693694695696
P E D N K Q V K L S L N D L F S E F K L N I E Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
697698
F K
- -
------
Class II
Eukaryotes/Leishmania infantum/amino acid sequences/Linfantum_thr_aa
Eukaryotes/Leishmania infantum/nucleotide sequences/Linfantum_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M S G K K K A A E A T V D L A T L A E P G F W R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
Q R V E I F E Q L W Q Q Q Q N R Y E S M K A P I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
K V S L P D G K V M D A E S W V T C P L D I A K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
R L S N S L P D K V I V A R V N E A L W D L T R
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
P F E A D C Q L E L L D W D E K D A R E V F W H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
S S S H V L G Y A L E R I F D T K L S V G P A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
E E G G F F Y E G L T N R P V S E S D Y K A I E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
S A M Q E L V K Q K M P Y Q R L E V S K E D A L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
R L F G Y T E F K S K I L A S K V P D G G S C T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
V Y R C G M L I D P C R G P H L P D T G R V K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F A V T K N S S S Y L E G K A E N E V L Q R V Y
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G I S F P K N P M L T E W K T I Q E E A A K R D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
289290291292293294295296297298299300301302303304305306307308309310311312
H R V I G R Q Q N L F N F H E V S P G S A F W L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
P H G A R I Y N T L V E F L R K K Y R R C G F Q
- - - - - I Y N T L V E F L R K K Y R R C G F Q
---------------ATCTACAACACTCTCGTAGAATTCCTGCGCAAGAAGTATCGCCGCTGCGGCTTTCAG
337338339340341342343344345346347348349350351352353354355356357358359360
E V I S P N M Y S S K L W M V S G H W E K Y A D
E V I S P N M Y - - - - - - - - - - - - - - - -
GAGGTCATCTCGCCGAACATGTAC------------------------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
N M F C T K C E K E D F G L K P M N C P G H C I
- - - - - - - - - - - - G L K P M N C P G H C -
------------------------------------GGTCTGAAGCCGATGAACTGCCCGGGCCACTGC---
385386387388389390391392393394395396397398399400401402403404405406407408
M F A S Q P H S Y K E L P I R Y A D F G V L H R
- - - - - - - - - - - - - I R Y A D F G V L H R
---------------------------------------ATTCGCTACGCCGACTTTGGCGTGCTGCACCGG
409410411412413414415416417418419420421422423424425426427428429430431432
N E L S G A L T G L T R V R R F Q Q D D A H I F
N - - - - - - - - - - - - R R F Q Q D D A H I F
AAC------------------------------------CGCCGCTTCCAGCAGGACGATGCACACATCTTC
433434435436437438439440441442443444445446447448449450451452453454455456
C R M D Q I T D E M E G Q M Q F L S D V Y G V L
- - - - - - - - - M E G Q M Q F L S D V Y G - -
---------------------------ATGGAGGGCCAGATGCAGTTCCTCAGCGACGTTTACGGC------
457458459460461462463464465466467468469470471472473474475476477478479480
G F K F Y F Y H S T R P A N K L G S E A L W D Q
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
S E S Y L R T A L N R F C G I P E E L P D P L H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
P D Q R F H Y D G K P D S V K K M K A L M K K A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
E R C E D P N A W K G P T N G G D G W I E N A G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
D G A F Y G P K I D I V V E D A L R R R H Q C A
- - - - - - - K I D I V V - - - - - - - - Q C A
---------------------AAGATCGACATCGTCGTC------------------------CAGTGCGCC
577578579580581582583584585586587588589590591592593594595596597598599600
T I Q L D F N L P S R F G L K Y T L P A A E K D
T I Q L D - - - - - - - - - - - - - - - - - - -
ACGATCCAGTTGGAC---------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
E T T V S P T E K Q K H A D P A L T A S S P A V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628629630631632633634635636637638639640641642643644645646647648
E D C V S K P K P G T Y E A A V R D L G I D L E
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
649650651652653654655656657658659660661662663664665666667668669670671672
L D A N Q A R P V M I H R A I L G S L E R S I A
- - - - - - - P V M I H R A I . . S L E R S I A
---------------------CCCGTCATGATCCACCGCGCCATT------TCCTTGGAGCGCTCGATCGCC
673674675676677678679680681682683684685686687688689690691692693694695696
I L C E H F G G D W P F W L S P R Q V M V V P V
I - - - - - - - - - - - - - - - - - - - - - - -
ATT---------------------------------------------------------------------
697698699700701702703704705706707708709710711712713714715716717718719720
S A S N Y E Y S Q Q V R D T M H D A G F H A D V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
721722723724725726727728729730731732733734735736737738739740741742743744
D N G A A T L D K K I R N A E K A R Y N F I L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
745746747748749750751752753754755756757758759760761762763764765766767768
V G Q K E Q D A T A V N I R A R G E K R L G N K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
769770771772773774775776777778779780781782783784785786787788
S L V E A V Q W L K E L A D T H N R E Y
- - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------
Class II
Eukaryotes/Paulinella chromatophora/amino acid sequences/Pchromatophora_thr_aa
Eukaryotes/Paulinella chromatophora/nucleotide sequences/Pchromatophora_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M D N S T D S V K Q N T M E L L K T S E S P Q L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
L K I R H S M S H V M A M A V Q K L F P N A Q I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T I G P W T E S G F Y Y D F D N P E P F T E A D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
L K S I K K G M I K I I N Q N L N F E R V E V T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
R Q D V A C R I K A Q N E P Y K L E I L A G L I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
E P I T I Y K L G E Q W W D L C A G P H V N N T
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N E L N P K A F D L E S V A G S Y W R G D E K K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
A K L Q R I Y G T A W E T P E Q L E E Y K R R K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
K E A L R R D H R R L G T D L D L F S I E D E A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
G S G L V F W H P N G A R I R L L I E D F W R Q
- - - - - - - - - - - - - I R L L I E D F W R Q
---------------------------------------GAAATCAAAAGCCGATAGGATACGTTCGGTTAA
241242243244245246247248249250251252253254255256257258259260261262263264
S H L E A G Y E L L Y T P H I A D I R L W K T S
S H L E A G Y E L L Y T P H I A - - - - - - - -
ATTCAATACTTCTAAAACTTCACTTCCTATTTGCTCTGGCAAACAAAA------------------------
265266267268269270271272273274275276277278279280281282283284285286287288
G H L D F Y S E S M F S P M Q V D E R E Y Q L K
- - - - - - - - - - - - - - - - - - - - - Q L K
---------------------------------------------------------------CTCAGCCCA
289290291292293294295296297298299300301302303304305306307308309310311312
P M N C P F H V L T Y A S K L R S Y R E L P I R
P M N C P F H V - - - - - - - - - - - - - - I R
CCGTATGGGTAGTTCACGGTAAGA------------------------------------------CATCGG
313314315316317318319320321322323324325326327328329330331332333334335336
W A E L G T V Y R Y E R P G V M H G L M R V R G
W A E L G T V Y R Y - - - - - - - - - - - - R G
CTTGAGTTGGTACTCTCGTTCATCGACTTG------------------------------------ATGTCC
337338339340341342343344345346347348349350351352353354355356357358359360
F T Q D D A H I F C L P E Q I G S E V L E V L N
F T Q D D A H I F - - - - - - - - - V L E V L N
TGACGTTTTCCAAAGACGAATATCCGC---------------------------ACCAGCTTCTAGGTGAGA
361362363364365366367368369370371372373374375376377378379380381382383384
L T E R I L S A F D F T K Y E I N L S T R P E K
L T E R I L S - - - - - - - - - - - - - - - - -
TTGGCGCCAGAAATCTTCAAT---------------------------------------------------
385386387388389390391392393394395396397398399400401402403404405406407408
F I G G D D V W D L A T N G L V E A L N A K N W
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
N Y K I D E G G G A F Y G P K I D L K I K D A I
- - - - - - - - - - - - - - K I D L K I - - - -
------------------------------------------AGCAGTTCCATAAATACG------------
433434435436437438439440441442443444445446447448449450451452453454455456
G R T W Q C S T I Q L D F N L P E R F N I E Y V
- - - - Q C S T I Q L D - - - - - - - - - - - -
------------GCCACGCCAATATGAACCAGCTAC------------------------------------
457458459460461462463464465466467468469470471472473474475476477478479480
G S D G S R Q R P I M I H R A I F G S L E R F F
- - - - - - - - P I M I H R A I . . S L E R F F
------------------------GCAAAGATCCCACCATTGTTCTCC------GTAAATAGTAATTGGTTC
481482483484485486487488489490491492493494495496497498499500501502503504
G V M I E S C A G D F P F W L A P E Q I R L L P
G V - - - - - - - - - - - - - - - - - - - - - -
GATAAG------------------------------------------------------------------
505506507508509510511512513514515516517518519520521522523524525526527528
V T D E V I T Y A E E L L S Q L K I A G V R A S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
I D R T G D R L G K L I R N G E Q K K I P I L A
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
V V G A K E A E V G G A S L R S R Y E G E L G L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599
V N A Y N L V Q T A T L A N C K Q N S R F S L
- - - - - - - - - - - - - - - - - - - - - - -
---------------------------------------------------------------------
Class II
Eukaryotes/Nosema ceranae/amino acid sequences/Nceranae_thr_aa
Eukaryotes/Nosema ceranae/nucleotide sequences/Nceranae_thr_nuc
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
M L N I F F D K K V Y K V E E N I S A H D F L V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
E N T N L E N I M I C K I D G V L S D L S T C L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72
T A D C K L S F H S F D E C K D I F W H S S A H
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96
I L G N A L V N L Y P S C K L I N G P P I E E G
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
97 98 99 100101102103104105106107108109110111112113114115116117118119120
F F Y D I D I D T P L S Q E D Y K N I E S E F K
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
121122123124125126127128129130131132133134135136137138139140141142143144
K I V K K N Y K Y E K V Y Y S K A D L Q K M Y V
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
145146147148149150151152153154155156157158159160161162163164165166167168
N N K Y K L H F V N T K V E H G S T V Y K N G D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
169170171172173174175176177178179180181182183184185186187188189190191192
F Y D L C Q G P H I P S T G L V K S V K I L K N
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
193194195196197198199200201202203204205206207208209210211212213214215216
S S V H H N D K Q V Q R I Y A I S F P N K D L M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
217218219220221222223224225226227228229230231232233234235236237238239240
S K Y L K M R D E A I K K D H R K L G R E L D L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
241242243244245246247248249250251252253254255256257258259260261262263264
F F F H E Y S P G S C F F L P N G T F L Y N K L
- - - - - - - - - - - - - - - - - - - L Y N K L
---------------------------------------------------------ATGTGCATCATCCTG
265266267268269270271272273274275276277278279280281282283284285286287288
C D L M R S E Y L K R G F Q E V I T P N I F S I
C D L M R S E Y L K R G F Q E V I T P N I F - -
TTGAAATCTTCTAACACGTGTCAGTCCTGTAAGTGCACCACTTAACTCATTTCTATGTAAAACACC------
289290291292293294295296297298299300301302303304305306307308309310311312
E L W K E S G H Y E N Y K D N I F M L E N E N M
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
313314315316317318319320321322323324325326327328329330331332333334335336
A M K P M N C P G H C L M F K N V D H S F R D L
A M K P M N C P G H C - - - - - - - - - - - - -
CATCGGTTTCATAGCCATATTTTCATTTTCTAA---------------------------------------
337338339340341342343344345346347348349350351352353354355356357358359360
P I R Y A D F G V L H R N E L S G A L T G L T R
- I R Y A D F G V L H R N - - - - - - - - - - -
---TTTCCATAACTCAATACTAAAAATATTTGGTGTTAT---------------------------------
361362363364365366367368369370371372373374375376377378379380381382383384
V R R F Q Q D D A H I F C T K E Q V K E E I S N
- R R F Q Q D D A H I F - - - - - - - - - I S N
---CATTAAATCACACAACTTGTTGTATAAAAAAGT---------------------------AGGAGAATA
385386387388389390391392393394395396397398399400401402403404405406407408
C L D F L K H I Y G I F N F Q F G L F L S T R P
C L D F L K H I Y G - - - - - - - - - - - - - -
TTCATGAAAAAAGAAAAGGTCTAATTCTCT------------------------------------------
409410411412413414415416417418419420421422423424425426427428429430431432
D K F I G E I E E W D L A E K A L E L A I R E S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
433434435436437438439440441442443444445446447448449450451452453454455456
N L N Y T L N E G D G A F Y G P K I D I I L Q D
- - - - - - - - - - - - - - - - K I D I I L - -
------------------------------------------------AGTAGAAGGAATGTGTGG------
457458459460461462463464465466467468469470471472473474475476477478479480
A L G R R I Q C G T I Q L D F Q L P Q R F K L K
- - - - - - Q C G T I Q L D - - - - - - - - - -
------------------TCCATTTTTATAAACAGTAGAACC------------------------------
481482483484485486487488489490491492493494495496497498499500501502503504
Y R N N D G N Q N T P V I I H R A I L G S V E R
- - - - - - - - - - P V I I H R A I . . S V E R
------------------------------TAAATCTGCCTTAGAATAATATAC------ATATTTATAGTT
505506507508509510511512513514515516517518519520521522523524525526527528
F I A I L I E S Y G K K L P F W L N P R Q I G I
F I A I - - - - - - - - - - - - - - - - - - - -
CTTTTTAACAAT------------------------------------------------------------
529530531532533534535536537538539540541542543544545546547548549550551552
V S L A D E K Y T E K V K D Y F K S F R C E V L
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
553554555556557558559560561562563564565566567568569570571572573574575576
R D N N T I N K N L K I L I N K A Y Y F V C V I
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
577578579580581582583584585586587588589590591592593594595596597598599600
G N K E A E K N T I N V R I N N N Q I E Y S L D
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
601602603604605606607608609610611612613614615616617618619620621622623624
D F K S I L S K L E E D K K E Y E D L S K E F S
- - - - - - - - - - - - - - - - - - - - - - - -
------------------------------------------------------------------------
625626627628
N L K I
- - - -
------------